Unfortunately, due to a lack of commercial feasibility, the SkyBLAST service has been suspended as of December 1st, 2025.
All subscriptions for paid accounts have been paused. For further information or enquiries, please email [email protected]

PREDICTED: Drosophila takahashii uncharacterized protein


LOCUS       XM_070218603            3192 bp    mRNA    linear   INV 09-DEC-2024
DEFINITION  PREDICTED: Drosophila takahashii uncharacterized protein
            (LOC138913805), mRNA.
ACCESSION   XM_070218603
VERSION     XM_070218603.1
DBLINK      BioProject: PRJNA1194641
KEYWORDS    RefSeq; includes ab initio.
SOURCE      Drosophila takahashii
  ORGANISM  Drosophila takahashii
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NC_091683) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI RefSeq
            Annotation Status           :: Full annotation
            Annotation Name             :: GCF_030179915.1-RS_2024_12
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 10.3
            Annotation Method           :: Gnomon; cmsearch; tRNAscan-SE
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            Annotation Date             :: 12/07/2024
            ##Genome-Annotation-Data-END##
            
            ##RefSeq-Attributes-START##
            ab initio :: 100% of CDS bases
            ##RefSeq-Attributes-END##
FEATURES             Location/Qualifiers
     source          1..3192
                     /organism="Drosophila takahashii"
                     /mol_type="mRNA"
                     /strain="IR98-3 E-12201"
                     /db_xref="taxon:29030"
                     /chromosome="X"
                     /sex="female"
                     /tissue_type="Whole fly"
                     /dev_stage="Adult fly"
                     /collected_by="Originally obtained from EHIME-Fly"
     gene            1..3192
                     /gene="LOC138913805"
                     /note="uncharacterized LOC138913805; Derived by automated
                     computational analysis using gene prediction method:
                     Gnomon. Supporting evidence includes similarity to: 15
                     Proteins"
                     /db_xref="GeneID:138913805"
     CDS             1..3192
                     /gene="LOC138913805"
                     /codon_start=1
                     /product="uncharacterized protein"
                     /protein_id="XP_070074704.1"
                     /db_xref="GeneID:138913805"
                     /translation="MDQFKLLKAARSRAKASITRLLTASQDPRAGSNWELDEITVSLE
                     RLNNVWKEFETISDQMALYDGEEGYIDPAIDNERYEDKYMQASTLFHTIKRRCQSSNE
                     SDREGSNGRQSGNIDDAASSSSGLGTESLARFLQQQQELNERLAEQQSTFLRANSAAN
                     VMHNELPKIHIKVFSGDYKEWPAFKNIFESTIHSKQHLTAIQKFHYLKTYITGEAADL
                     IRHMPITDAAYEAAWSCLTERYNRPRHIVNTLLETFVNLPSTSRADVAVLRKVTDGAT
                     EIVRGLDAAGQTNRDCWIIHFILAKIDAETRRKWIEGSRVLESPSVDDLLKFLDRRCE
                     EFELIKSESDIDFKVGAPQLSKAKRSSHALVSMEDNACVKCNSKEHKIYGCPKFAEAS
                     IDQRRTFVKTKSLCFNCLKLGHVSRKCESKFTCKICHNRHYSLLHADIPGSQAAVTTT
                     QPHTDERHVSSAPGDATVTISHIARAQAAPTAESLCNGSTTATQPQGLRKSAFPTALV
                     FVKTAKGSHITCRVLLDSGSELSYISERCVQALGLSRSPSRIVVSGISSIKAETTRGC
                     STLDMQSRISDHTMKVRAHVLSKITSTLARHDIESSALKAFAGFELADSDYQSLAPVD
                     ILLGSDYVWTVFTGQKMFDIQGNIIAISTIFGWVITSIVTTGCSSTTTMHSAIDIDST
                     LRRFWELEDVNQEFHGKPEDDEVEQHFMKTHTRDSKGRYIVELPFKNSNEQFSDTLQG
                     ALARFRGVERRLKKDPDLHSKYVKFMREYLQLGHMRELSPGDIDKGKSFYLPHHPVIT
                     QKLRVVFDGSFKDTNGKSLNDALHIGPSILRNLFSICMRFRMFKFVFSADIVKMYRQI
                     LVAANHCSYQRIVWREDESTPIKHYELSTVTYGTSSAPFLAVRVLDQLANDHQQEFPT
                     AARILKEQFYVDDVLTGAPTEEELIYNQKELIQLMKCAGMELGKWVSNSSRITDRATS
                     TTEVQGKGSTPTSKVLGIHWDPEEDTLSYKVCLAPNPDNTKRQVLSDVARSTVFDPLG
                     ILSPVVVQFKILFQELWLLDLGWDTELPPKIAD"
     misc_feature    520..957
                     /gene="LOC138913805"
                     /note="Protein of unknown function (DUF1759); Region:
                     DUF1759; pfam03564"
                     /db_xref="CDD:281552"
     misc_feature    <1099..>1302
                     /gene="LOC138913805"
                     /note="Arginine methyltransferase-interacting protein,
                     contains RING Zn-finger [Posttranslational modification,
                     protein turnover, chaperones / Intracellular trafficking
                     and secretion]; Region: AIR1; COG5082"
                     /db_xref="CDD:227414"
     misc_feature    1522..2013
                     /gene="LOC138913805"
                     /note="Cellular and retroviral pepsin-like aspartate
                     proteases; Region: pepsin_retropepsin_like; cl11403"
                     /db_xref="CDD:472175"
     misc_feature    order(1573..1575,1579..1581,1585..1587,1654..1662)
                     /gene="LOC138913805"
                     /note="inhibitor binding site [active]"
                     /db_xref="CDD:133136"
     misc_feature    1573..1581
                     /gene="LOC138913805"
                     /note="catalytic motif [active]"
                     /db_xref="CDD:133136"
     misc_feature    1573..1575
                     /gene="LOC138913805"
                     /note="Catalytic residue [active]"
                     /db_xref="CDD:133136"
     misc_feature    order(1654..1665,1675..1686)
                     /gene="LOC138913805"
                     /note="Active site flap [active]"
                     /db_xref="CDD:133136"
     misc_feature    2362..2991
                     /gene="LOC138913805"
                     /note="Reverse transcriptase (RTs) in retrotransposons.
                     This subfamily represents the RT domain of a
                     multifunctional enzyme. C-terminal to the RT domain is a
                     domain homologous to aspartic proteinases (corresponding
                     to Merops family A17) encoded by...; Region: RT_pepA17;
                     cd01644"
                     /db_xref="CDD:238822"
     misc_feature    order(2542..2559,2662..2667,2770..2772,2776..2781,
                     2962..2967)
                     /gene="LOC138913805"
                     /note="putative active site [active]"
                     /db_xref="CDD:238822"
     misc_feature    order(2542..2559,2662..2664,2776..2778)
                     /gene="LOC138913805"
                     /note="putative NTP binding site [chemical binding]; other
                     site"
                     /db_xref="CDD:238822"
     misc_feature    2665..2667
                     /gene="LOC138913805"
                     /note="putative nucleic acid binding site [nucleotide
                     binding]; other site"
                     /db_xref="CDD:238822"
     misc_feature    3034..>3189
                     /gene="LOC138913805"
                     /note="Pao retrotransposon peptidase; Region:
                     Peptidase_A17; pfam05380"
                     /db_xref="CDD:461634"
ORIGIN      
        1 atggatcagt ttaagcttct aaaggcagca agaagtcgtg cgaaggcaag cattacgcgt
       61 ttgctaacgg cgtcacaaga tccacgtgcg ggatcaaatt gggaattgga tgaaatcaca
      121 gtctcattgg aaaggctcaa caacgtttgg aaggagtttg agaccattag cgatcaaatg
      181 gccctttatg atggagaaga ggggtacatc gatccagcca tcgacaacga gaggtacgag
      241 gataagtaca tgcaagcaag caccttgttt cacaccatta aacggcgctg tcagtcatcc
      301 aatgagagcg acagagaagg cagcaacggt aggcaatctg gcaacattga cgatgccgca
      361 tcaagttcat caggattggg aaccgaaagc cttgctcgtt ttctacaaca acagcaggag
      421 ctgaatgagc gtttagctga gcagcaatca acatttttga gagcaaactc cgcagcaaat
      481 gtaatgcaca acgagctgcc aaaaatccac atcaaggtgt tttctggtga ctacaaagag
      541 tggccagcct ttaaaaacat ctttgagagt acgatccaca gcaagcagca tttgacagca
      601 atacaaaagt tccactactt aaaaacgtac attactgggg aagcagcgga cttgattcgt
      661 catatgccaa taacggatgc tgcttatgag gctgcttgga gctgcctaac tgagcgatac
      721 aacagaccac gtcacattgt caacactcta ctggaaacgt ttgtaaatct cccttcgaca
      781 tccagggcag atgttgcagt tctgcgcaag gtgaccgacg gagccacgga gattgtacga
      841 ggattggatg cagcagggca aactaacagg gactgctgga tcatacactt cattctggcc
      901 aaaatcgacg ctgaaactcg acgcaaatgg attgagggaa gccgggtact tgaatctccg
      961 tctgtggatg atttactcaa gtttttagac cgacgctgcg aggaattcga gctcatcaaa
     1021 agtgagtcag acatagactt caaggttggc gcaccacaac tgagcaaagc aaagcgttcg
     1081 tcccatgcct tagtatcgat ggaagataat gcttgtgtga aatgtaactc taaggagcac
     1141 aagatctacg gttgcccaaa gtttgctgaa gcatcgatcg accagagacg cacatttgta
     1201 aagacaaaat ccttgtgttt caactgtctt aagcttgggc atgtctcacg caagtgtgaa
     1261 tccaaattca catgcaagat ttgccataat cgccattact cgctgctaca tgcagatatt
     1321 cctggatcgc aagccgctgt gaccacgaca cagccacata ctgatgaaag gcacgtctca
     1381 agcgctcccg gagatgctac ggtgaccatc agccatattg ctcgcgcgca agcggctccc
     1441 acagctgagt ccttgtgcaa cggatcaaca acggctacac agccccaagg gctaaggaaa
     1501 agtgcatttc caacagctct ggtatttgta aaaaccgcaa aaggatcgca cattacatgt
     1561 cgggtacttt tggacagtgg ttcggaactg tcgtacatct cagagaggtg cgtacaggca
     1621 cttggtctgt cacgctcgcc ctcacgcatt gtagtgtctg gaatttcatc gatcaaggcg
     1681 gagacaacta gaggctgcag cacactggac atgcagtcaa ggatctcaga tcacacaatg
     1741 aaagtacgcg cacacgtact cagcaaaatt acctccacgt tagcaagaca cgatatcgag
     1801 tcctcagcac tcaaggcatt tgctggcttt gagcttgcgg attctgatta tcaatcgttg
     1861 gcgccagtcg atattctttt gggcagcgat tacgtttgga ccgtgttcac cggtcaaaag
     1921 atgttcgaca tccagggcaa catcatcgcc atttcgacca tttttggatg ggtcataaca
     1981 tctatcgtta ctaccggctg ttcatctaca acaacaatgc actcggctat tgacattgac
     2041 tcaacgcttc ggcgcttttg ggagctggag gatgtcaacc aggaattcca tgggaaacca
     2101 gaggacgatg aagttgaaca gcactttatg aaaacgcaca ctcgggactc caaggggcgt
     2161 tacatagtcg aacttccgtt caaaaactcc aacgaacagt tttcggatac tttacaagga
     2221 gcactggcaa gattcagggg tgtagaacgc cgcctaaaga aggaccccga tctgcactca
     2281 aagtatgtaa aatttatgcg tgaatacctt cagttaggac acatgcggga attatcgcca
     2341 ggcgacattg acaaagggaa aagcttttac ttgcctcatc atccagtaat tacccaaaag
     2401 ctaagggtag tatttgacgg ctcattcaag gatacgaatg gaaaatcctt aaacgatgct
     2461 ctacacattg gacccagcat tctccgaaac ctcttctcga tttgtatgcg tttcagaatg
     2521 tttaagttcg tcttttctgc agatattgtc aaaatgtatc gacaaatctt ggtggctgcc
     2581 aaccattgta gctatcagcg tattgtttgg agagaagatg aaagtacacc tatcaagcac
     2641 tatgagcttt ccacggtgac atatggcaca tctagtgcac cattcttggc agtaagagtc
     2701 ctggatcagt tagctaacga ccaccaacaa gagtttccca ccgctgcaag aatcttgaag
     2761 gagcagtttt atgtggacga cgtactgacg ggagcaccta cagaggagga gctaatttac
     2821 aatcaaaaag agctgatcca attaatgaaa tgtgcaggca tggaacttgg caaatgggtt
     2881 tcaaattcat cacgtataac tgatcgagct acttctacaa ccgaggtaca aggcaaagga
     2941 tccactccta catcaaaggt tcttggcatt cattgggatc cagaagagga tacgttatcc
     3001 tacaaagttt gccttgcacc aaatccggac aacaccaagc gccaagtgct gtctgacgta
     3061 gcacggagca ctgtctttga cccgctgggt attttgtcgc cagtggtggt gcagtttaaa
     3121 attctgttcc aagaattgtg gttactggat ctcggctggg acacggagct tcctccaaaa
     3181 attgctgact ag