Unfortunately, due to a lack of commercial feasibility, the SkyBLAST service has been suspended as of December 1st, 2025.
All subscriptions for paid accounts have been paused. For further information or enquiries, please email [email protected]

PREDICTED: Drosophila takahashii uncharacterized protein


LOCUS       XM_070218599            4422 bp    mRNA    linear   INV 09-DEC-2024
DEFINITION  PREDICTED: Drosophila takahashii uncharacterized protein
            (LOC123003500), mRNA.
ACCESSION   XM_070218599
VERSION     XM_070218599.1
DBLINK      BioProject: PRJNA1194641
KEYWORDS    RefSeq; includes ab initio.
SOURCE      Drosophila takahashii
  ORGANISM  Drosophila takahashii
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NC_091683) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI RefSeq
            Annotation Status           :: Full annotation
            Annotation Name             :: GCF_030179915.1-RS_2024_12
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 10.3
            Annotation Method           :: Gnomon; cmsearch; tRNAscan-SE
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            Annotation Date             :: 12/07/2024
            ##Genome-Annotation-Data-END##
            
            ##RefSeq-Attributes-START##
            ab initio :: 100% of CDS bases
            ##RefSeq-Attributes-END##
FEATURES             Location/Qualifiers
     source          1..4422
                     /organism="Drosophila takahashii"
                     /mol_type="mRNA"
                     /strain="IR98-3 E-12201"
                     /db_xref="taxon:29030"
                     /chromosome="X"
                     /sex="female"
                     /tissue_type="Whole fly"
                     /dev_stage="Adult fly"
                     /collected_by="Originally obtained from EHIME-Fly"
     gene            1..4422
                     /gene="LOC123003500"
                     /note="uncharacterized LOC123003500; Derived by automated
                     computational analysis using gene prediction method:
                     Gnomon. Supporting evidence includes similarity to: 11
                     Proteins"
                     /db_xref="GeneID:123003500"
     CDS             1..4422
                     /gene="LOC123003500"
                     /codon_start=1
                     /product="uncharacterized protein"
                     /protein_id="XP_070074700.1"
                     /db_xref="GeneID:123003500"
                     /translation="MKTVPSIVLRLVREGSRLTSHVVSHGVWKEFNEFGDANAVHEEV
                     EGYVDPEIDNAIYEEKYLRAIAILKDRSDALQPSTSTGITNGSNGLHSNNDAIVNLLQ
                     QNQQLFERLAANQASSSTPVQVGGDVTLANLSSVFAANSNQSELPKIQIKRFSGNYTE
                     WPSFKDIYENTIHNKQHLSNTQKFHHLKTLLVDEAANLVRHLAITETAYNTAWERLKE
                     RYNHPRHIVNSFLEQFMSLPTTTKVDASILRKVSDGANEIIRGLDAVNQMGRDCWIIY
                     LALEKLNADTRRRWIERSMDTDSPTLEEFFKFLDSRCEELELSKRELATGGKTTTHAE
                     KPKRVTQSMVAVEGSGCTKCNSTEHTLYSCQQFLDMSGMQRRSFVKEKSLCYNCLRPG
                     HGVSKSKSTYKCRQCKGNHHSLLHVQANPQAIGNLAQIAGEDERNTSASNNTSVTLSH
                     FAQGEGTQSVVCAQGTAKSAQESEVKRSILTTAMVYVQNAKGDHVTCRLLLDTGSELS
                     YVSERCIQALGLTRSASRILVTGISSVKADTTRGCSTLHIKSRISEDQLVVYAHVLGR
                     ITSSLERQNIDASALKVFKDLQLADTEFNTNSPVDILLGSEHVWSVFTGRKMFDNKVD
                     IGATLQKFWELENVQSSAKLEPEDDQVEKHFLATHSRDVNGKHIVELPFNTENPEFGG
                     TLQGALKRFKSAERRLQQNEQLRPSIQRDLFAVCLRFRMYKFAFSADIVKMFRQIWVN
                     EKHRNFQKIVWREDPSDPIKHFQLCTVTYGTSCAPFLAVRVLEQLAIDHQEEYPNASK
                     ILLEDFYVDDVLTGSNSEDELLRNRNELVELMSRANLELGKWVSNTPCIQTDNSDTQS
                     AQISPVKVLGLYWHPGNDVLTYNVGLAANPDCTKRQVLSDVSRIFDPLGLLAPIVIQF
                     KILFQKLWLLNLDWDDPLPTKLADNWLKWRADLDTLQKFRLPRFVHNDPDNIELHGFS
                     DASTKAYAAVVYSRVTNDDGSISVSIVAAKTRVAPLKQQSLPRLELCAALLLSQLIRS
                     ITSGLRHKNITVFGWSDSSIVLSWLSYAPAQLKTFVGNRTSEILDTIPRSAWRHVDSK
                     TNPADCASRGLMAADLIDFHLWWNGPQWLRDKDQYLVKLNDSRFGLSLTDKRIQGEVK
                     SNCLATLTEATQIHLLDELIERVSSWIKLVHIVGYVMRFIQRTRNPSREKVSGALSFD
                     EIKAARILCIKHAQGCFKDDYQLLLGKKPLKNRSQLVKLAPIIDENDLLRVGERLHHS
                     QLSRDAKHPVLLPKTHRISKLILEHEHRVNHHPGVSSLFVIVRQKFWIFGARNLIRKI
                     THDCLACFRQRSHTSQQQMANLPSVRITQALPFIHTGCDYAGPILLKDAKVRKPRISK
                     GYICLFVCMVTSAIHLELATDLTTETFLAALRRFISLRGKCSKIYSDNGTNFIGAKRS
                     LDEMQELLSSQTHKDTVSSTLADDGIQWNHRKLNAHL"
     misc_feature    460..897
                     /gene="LOC123003500"
                     /note="Protein of unknown function (DUF1759); Region:
                     DUF1759; pfam03564"
                     /db_xref="CDD:281552"
     misc_feature    1453..1929
                     /gene="LOC123003500"
                     /note="Cellular and retroviral pepsin-like aspartate
                     proteases; Region: pepsin_retropepsin_like; cl11403"
                     /db_xref="CDD:472175"
     misc_feature    order(1504..1506,1510..1512,1516..1518,1585..1593)
                     /gene="LOC123003500"
                     /note="inhibitor binding site [active]"
                     /db_xref="CDD:133136"
     misc_feature    1504..1512
                     /gene="LOC123003500"
                     /note="catalytic motif [active]"
                     /db_xref="CDD:133136"
     misc_feature    1504..1506
                     /gene="LOC123003500"
                     /note="Catalytic residue [active]"
                     /db_xref="CDD:133136"
     misc_feature    order(1585..1596,1606..1617)
                     /gene="LOC123003500"
                     /note="Active site flap [active]"
                     /db_xref="CDD:133136"
     misc_feature    2101..2622
                     /gene="LOC123003500"
                     /note="conserved catalytic core domain of RNA-dependent
                     RNA polymerase (RdRp) from the positive-sense
                     single-stranded RNA [(+)ssRNA] viruses and closely related
                     viruses; Region: ps-ssRNAv_RdRp-like; cl40470"
                     /db_xref="CDD:477363"
     misc_feature    order(2185..2202,2305..2310,2413..2415,2419..2424,
                     2608..2613)
                     /gene="LOC123003500"
                     /note="active site"
                     /db_xref="CDD:238185"
     misc_feature    order(2185..2202,2305..2307,2419..2421)
                     /gene="LOC123003500"
                     /note="NTP binding site [chemical binding]; other site"
                     /db_xref="CDD:238185"
     misc_feature    2308..2310
                     /gene="LOC123003500"
                     /note="nucleic acid binding site [nucleotide binding];
                     other site"
                     /db_xref="CDD:238185"
     misc_feature    2665..3144
                     /gene="LOC123003500"
                     /note="Pao retrotransposon peptidase; Region:
                     Peptidase_A17; pfam05380"
                     /db_xref="CDD:461634"
     misc_feature    3820..3999
                     /gene="LOC123003500"
                     /note="Integrase zinc binding domain; Region:
                     Integrase_H2C2; pfam17921"
                     /db_xref="CDD:465569"
ORIGIN      
        1 atgaagacag ttcccagcat cgttctacgg ttggttaggg agggctcaag gctaacatca
       61 cacgttgtct ctcatggtgt ttggaaggag ttcaacgagt tcggcgatgc caatgctgtc
      121 cacgaggaag tagaaggtta cgtcgatccg gagatcgata atgcgattta cgaagaaaag
      181 tacctaaggg cgatcgcaat tctcaaggac agaagtgatg ctctacaacc gagtacatct
      241 acaggcatta cgaatggcag caacggtctg cattccaaca acgacgcaat tgtcaatttg
      301 ctgcaacaaa accaacaact atttgagcga ctggctgcaa atcaggctag ttcgagcacg
      361 ccggttcaag ttggtggtga cgtcactttg gcgaatttaa gttcggtatt cgcggcgaat
      421 tctaatcaga gcgaattgcc aaaaattcaa atcaagcggt tctctggcaa ctacacagag
      481 tggccctcct ttaaagacat ctatgaaaac acaattcata acaagcaaca tttgtccaac
      541 acacagaagt tccatcactt gaaaacactt cttgttgatg aggctgccaa cttggtacgg
      601 cacttggcca ttacggagac tgcttacaac acagcttggg aacgtcttaa ggagaggtac
      661 aatcatccac ggcacattgt aaactcattt ttggagcagt ttatgagcct accaacaact
      721 acaaaggtag atgcatcaat tctacgaaag gtgtcagacg gagcaaacga aattattcgc
      781 ggattggatg cggtcaacca gatgggacgc gattgctgga ttatctatct ggccctggag
      841 aaacttaacg ctgacacgcg gcgcaggtgg attgagcgca gcatggacac ggattcacca
      901 actctcgagg aattcttcaa gtttctcgat tctcgttgcg aggaactgga gctgagtaaa
      961 agggagcttg ctactggtgg caaaacaaca acacatgcag aaaaaccaaa aagggtcaca
     1021 caatcgatgg ttgcggtcga aggcagtggc tgcaccaaat gtaattctac agaacacact
     1081 ctgtacagct gtcagcagtt cttggatatg tccgggatgc agaggcgatc cttcgtaaag
     1141 gagaaatcac tgtgctacaa ctgcttgcga cctggtcatg gggtcagcaa gagcaagtcg
     1201 acatacaaat gtaggcaatg caagggaaat catcactccc ttcttcatgt ccaagcgaat
     1261 ccacaggcta ttgggaatct tgcccagata gcaggggagg acgagcgaaa cacaagcgcg
     1321 tccaacaaca catcggtgac tctcagtcat ttcgcccaag gagagggcac tcaatcggtt
     1381 gtatgtgcac agggcactgc aaaatctgca caggaatcgg aagttaagcg aagcatatta
     1441 acaactgcca tggtttatgt tcaaaacgca aaaggtgacc acgtaacatg ccgtctctta
     1501 ttggacacgg gctcagagct ttcctacgta tccgagcgtt gcatccaagc actcggattg
     1561 acacggtcgg catcacgcat cttggttacc ggaatctctt cggtgaaagc agacacgacc
     1621 aggggatgca gcaccttgca tatcaagtct cgtatctccg aggatcagtt ggttgtctac
     1681 gcgcacgtgc taggcaggat cacttcttcg ctggaaaggc aaaacatcga tgcatcggcg
     1741 ctcaaggttt tcaaggatct gcagttggcg gatactgaat tcaacacaaa ctcacctgtt
     1801 gacattctat tgggcagcga acacgtatgg tcagtgttta caggacgaaa gatgttcgac
     1861 aacaaggtgg acataggtgc cacgcttcag aagttttggg aactagaaaa cgttcaaagc
     1921 agcgcaaaat tggaaccgga ggatgatcaa gtggagaagc attttctcgc cactcacagt
     1981 cgcgatgtaa acggaaagca tatcgtggaa cttccattca acactgaaaa ccccgaattc
     2041 ggaggaactc tacaaggagc gctcaaacgc tttaaatcgg ctgagcggcg gctgcaacag
     2101 aacgagcagc tgcggcccag tatccagcgc gatctattcg ctgtgtgcct tcgttttcga
     2161 atgtacaaat ttgcattctc agcggacatc gtaaaaatgt tccgccagat atgggtcaac
     2221 gaaaagcaca gaaacttcca gaaaatcgtt tggagagaag atccatccga tcccatcaag
     2281 catttccaat tgtgcacggt aacctacgga acttcgtgcg cgccattcct ggcggtgcga
     2341 gtgctggaac aacttgctat cgatcatcaa gaggaatacc caaatgcgtc gaaaatcctg
     2401 ctggaggatt tttatgtcga tgatgttctt actgggtcaa acagtgagga tgagctactt
     2461 cgaaaccgaa acgagctggt tgagctgatg tctcgcgcca accttgaact cggaaaatgg
     2521 gtatcgaata cgccatgtat acaaacggat aatagcgaca cacaatctgc acaaatttca
     2581 ccagtgaagg ttctcggact gtactggcat cctggaaacg acgttctaac gtacaacgtc
     2641 ggtcttgctg caaatcctga ttgcacaaag agacaagtct tgtccgacgt ctcgaggata
     2701 tttgatcctc tcggactctt ggcacccatt gtcattcaat tcaaaatcct tttccaaaag
     2761 ctctggctct tgaatttgga ttgggatgac ccactcccaa ctaaactggc ggacaactgg
     2821 ctgaagtgga gagcagatct ggacactctt caaaaattcc gactaccacg atttgttcac
     2881 aacgacccgg acaacatcga actccacgga ttttcggatg cttcaaccaa ggcgtatgct
     2941 gctgtggtgt acagcagagt tacaaatgac gatggatcca tctcggtgtc cattgtggct
     3001 gcgaaaacaa gggtggctcc actgaaacaa caatccttgc cacgtctgga actttgcgca
     3061 gcacttctcc tcagccaact gattcgctca atcacatctg gattacgcca caagaacata
     3121 actgtttttg gctggtccga ctcatcaata gtgctctcct ggctatcgta tgcgccagcc
     3181 caactcaaga catttgttgg aaacagaacc tcggaaatcc ttgacaccat tccaaggagc
     3241 gcttggcgtc acgtcgattc caaaacaaac ccagctgact gtgcgtccag gggattgatg
     3301 gctgctgatc tcatcgactt ccatttgtgg tggaatgggc ctcaatggct acgggacaag
     3361 gatcagtacc tggtaaagtt aaatgattca cggttcggtt tatctcttac agacaaacgc
     3421 attcaaggag aagtcaaatc caactgtttg gctacattga cagaagcaac ccagattcat
     3481 ctacttgatg aactaatcga acgagtctct tcttggatca agctcgtaca cattgtcggc
     3541 tacgtgatgc ggtttattca acgtactcga aatccatctc gcgaaaaggt atccggagca
     3601 ctctcatttg acgagatcaa agcggcaagg attctttgca taaagcacgc acaagggtgt
     3661 ttcaaagacg attaccaact actcctcggt aaaaaacccc tcaagaaccg atcacagctg
     3721 gtcaaactgg cacccataat cgacgaaaac gatttgctaa gggtaggcga acgactgcat
     3781 cactcgcagt tgtcaaggga tgcaaaacac ccagttttgc taccgaaaac acatcgcata
     3841 tcaaagctaa ttctggaaca tgagcaccga gtgaaccacc accctggagt ttcctcactt
     3901 tttgttattg ttcggcaaaa attctggata tttggagcac ggaatctaat tcggaagata
     3961 acacacgact gtttagcttg ctttcgtcaa cgctcccaca catctcagca acaaatggct
     4021 aatttaccca gcgtacgcat tactcaagcg cttccattta tacatactgg ttgcgactat
     4081 gcaggtccaa tccttctgaa ggatgcaaag gttcggaagc cacgtatcag caagggttac
     4141 atatgcctat ttgtgtgcat ggtcacctcg gccatccacc tggaacttgc aacagacctg
     4201 accacagaaa ctttcttggc tgccttgcgg cgcttcatat ccttacgtgg caagtgcagt
     4261 aagatctaca gtgacaatgg cacaaacttt attggagcta agcgatccct cgacgagatg
     4321 caagaattgc tttcttcaca aacacacaag gacaccgttt ctagcacact agcggatgat
     4381 ggtatccaat ggaatcaccg gaaactcaac gctcaccttt ga