Unfortunately, due to a lack of commercial feasibility, the SkyBLAST service has been suspended as of December 1st, 2025.
All subscriptions for paid accounts have been paused. For further information or enquiries, please email [email protected]

PREDICTED: Drosophila takahashii uncharacterized protein


LOCUS       XM_044396095            6482 bp    mRNA    linear   INV 09-DEC-2024
DEFINITION  PREDICTED: Drosophila takahashii uncharacterized protein
            (LOC123003484), transcript variant X2, mRNA.
ACCESSION   XM_044396095
VERSION     XM_044396095.2
DBLINK      BioProject: PRJNA1194641
KEYWORDS    RefSeq.
SOURCE      Drosophila takahashii
  ORGANISM  Drosophila takahashii
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NC_091683) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On Dec 9, 2024 this sequence version replaced XM_044396095.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI RefSeq
            Annotation Status           :: Full annotation
            Annotation Name             :: GCF_030179915.1-RS_2024_12
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 10.3
            Annotation Method           :: Gnomon; cmsearch; tRNAscan-SE
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            Annotation Date             :: 12/07/2024
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..6482
                     /organism="Drosophila takahashii"
                     /mol_type="mRNA"
                     /strain="IR98-3 E-12201"
                     /db_xref="taxon:29030"
                     /chromosome="X"
                     /sex="female"
                     /tissue_type="Whole fly"
                     /dev_stage="Adult fly"
                     /collected_by="Originally obtained from EHIME-Fly"
     gene            1..6482
                     /gene="LOC123003484"
                     /note="uncharacterized LOC123003484; Derived by automated
                     computational analysis using gene prediction method:
                     Gnomon."
                     /db_xref="GeneID:123003484"
     CDS             833..6043
                     /gene="LOC123003484"
                     /codon_start=1
                     /product="uncharacterized protein isoform X2"
                     /protein_id="XP_044252030.1"
                     /db_xref="GeneID:123003484"
                     /translation="MAADKDQEQGQASSDASLSNLHILQADIFERVKQLYQNFKKDSQ
                     SRKTKIYFQTRINKLENFSKEFDTNHQTLLLNGCSPEHEYFTSQLAARFEESYLTYYC
                     EIGDAFETRFPTVPSDATPSHSNSTMHNTTMLQAPGSTVQLPKLPVPSYSGKLTEWPA
                     FHDVFQQLIHDNGALSSIQKFHFLKQALPADRDQDVHQMDLTEANYLVAWSLIVTRYN
                     NPRLLFMHHMNTLYELPSISKESSAELKHMLNVANVCINEFKRLNIAIANCDHWIVHH
                     LTTKLPSQTIQAWEHSLGSTKEIPTFFTLESFLNNRLFSIDIIEGRKVPPPPRQPQGV
                     NGFQRNVIKHSGNAQTRISSCHTSGVTTNSVRCAHCNDQHILRRCPDFLAKDSFARKL
                     IVDRSKVCLNCLSPTHSLSKCNSSKNCLQCGQRHHTLLHFPTQVKASDVAQSAGNITS
                     LNSQGLTASSNTTQLISASASHSTPHTMILATALVRLHSNATGQSAVVRALIDHGSEG
                     TLVTETVVQALGLPRFPVSAEISGVGGNSTNRCKYRTECTLSSTTNSGFKMWVENAFV
                     LRTLTSPLPRTNLTLPTCPHLTGLELADPNFMHTNSIDVLLGVDTIPQFMMSGIRRGS
                     YDQPIAQCTQLGWIIFGRITPKQTHTISIQCHHSNLETLVQKFFELEARKFQKKPDLY
                     EQYSKVMEEYFELHQITEAITSEEQHRLADKGGSISYTACTLPHHAVLKADSSTTKLR
                     VVYDASCKTSNGKSLNDILCIGPALQNDLGGVILNWRFLQYVFAADIQKMYRCIDVHP
                     EDTHFQRIIWQRENNAIKDYCLTTVTFGTASAPYTAIRIMHQIAQDERDQFPLAEHVL
                     RKEIYVDDLQSGHETIKGALQVRDDVIGALQSAGMELRKWAANHPSLLNSIPPEHMSN
                     SKILEIENQESIKTLGLYWHPKEDFYGFKLKFTIDEIFTKRSILATVARLYDPLGFVA
                     PVIIIAKVILKEVWSIRIQQADGTPAGLAWDATVPPVIQHKWKEYCTNLLKIESLRIP
                     RWLQYLPSTIASLQLHIFCDGSSMAYAACAYVRVQHTNNSVYTHLIAAKSRVTPTKPL
                     TIPRVELCGAVLAAQLGDWLCKQIDQPTHPISTYFWSDATIVLYWIAGDPLHWKTFVA
                     NRVGRILESSSASQWRHVPTGDNPADCATRGLYPDQLAAYDLWWQGPSWLRLPESQWP
                     SKIFDIPDSTNLSCEQKSLSLQTHSCVERNPNSLLTSFSSYNKLLFIMAYVRRFIHNS
                     QTRVDSRQRGPVTAQEFQQALGHIVRLVQHETFKVEIQKIKTKTHLSRSNKLSQLSPF
                     LDNEGVLRVRGRLKNALHLSPHQRTPIILPKDHHFTELVIRNAHLNTLHGGISLTLAV
                     TRQTFWILNGKQAVKKILHKCVDCFKHRPKAVTQLMGDLPLHRVNPPKRAFEATGVDY
                     TGALEIKASKFRGHHKYKAYIAVFICLATKAVHLEAVTGLSSQDFLWALQRFIGRRGY
                     CQHIYSDCGTNFIGADKSLNLWHEEFRQSVIATVIPKLTAQQIQWHFNPPHSPNFGGL
                     WEANVKAVKTHLHRTCKGALMTYEQLSTILVQIEACLNSRPLCPLSSDMEDLAVLTPA
                     HFLIGDSMMALPNPSASDKSLNAQFLEGQRLLRTFWHRWSSDWLSHLQSRPKWQRVEE
                     NLRLHDIVIIKDDRLPPNEWKLGRIVELHPGSDNLIRVASIKTASGIYKRSLSKICPL
                     PLATYSEATE"
     misc_feature    1283..1726
                     /gene="LOC123003484"
                     /note="Protein of unknown function (DUF1759); Region:
                     DUF1759; pfam03564"
                     /db_xref="CDD:281552"
     misc_feature    2297..2749
                     /gene="LOC123003484"
                     /note="Cellular and retroviral pepsin-like aspartate
                     proteases; Region: pepsin_retropepsin_like; cl11403"
                     /db_xref="CDD:472175"
     misc_feature    order(2339..2341,2345..2347,2351..2353,2420..2428)
                     /gene="LOC123003484"
                     /note="inhibitor binding site [active]"
                     /db_xref="CDD:133137"
     misc_feature    2339..2347
                     /gene="LOC123003484"
                     /note="catalytic motif [active]"
                     /db_xref="CDD:133137"
     misc_feature    2339..2341
                     /gene="LOC123003484"
                     /note="Catalytic residue [active]"
                     /db_xref="CDD:133137"
     misc_feature    order(2420..2431,2441..2452)
                     /gene="LOC123003484"
                     /note="Active site flap [active]"
                     /db_xref="CDD:133137"
     misc_feature    3002..3646
                     /gene="LOC123003484"
                     /note="conserved catalytic core domain of RNA-dependent
                     RNA polymerase (RdRp) from the positive-sense
                     single-stranded RNA [(+)ssRNA] viruses and closely related
                     viruses; Region: ps-ssRNAv_RdRp-like; cl40470"
                     /db_xref="CDD:477363"
     misc_feature    order(3188..3205,3305..3310,3413..3415,3419..3424,
                     3632..3637)
                     /gene="LOC123003484"
                     /note="active site"
                     /db_xref="CDD:238822"
     misc_feature    order(3188..3205,3305..3307,3419..3421)
                     /gene="LOC123003484"
                     /note="NTP binding site [chemical binding]; other site"
                     /db_xref="CDD:238822"
     misc_feature    3308..3310
                     /gene="LOC123003484"
                     /note="nucleic acid binding site [nucleotide binding];
                     other site"
                     /db_xref="CDD:238822"
     misc_feature    3689..4210
                     /gene="LOC123003484"
                     /note="Pao retrotransposon peptidase; Region:
                     Peptidase_A17; pfam05380"
                     /db_xref="CDD:461634"
     misc_feature    4886..5056
                     /gene="LOC123003484"
                     /note="Integrase zinc binding domain; Region:
                     Integrase_H2C2; pfam17921"
                     /db_xref="CDD:465569"
     misc_feature    5747..6010
                     /gene="LOC123003484"
                     /note="Family of unknown function (DUF5641); Region:
                     DUF5641; pfam18701"
                     /db_xref="CDD:465838"
ORIGIN      
        1 cggacgtttg ctgtagttga gagaacataa acccaccact ctgttataac cgagttttat
       61 gtaaagggag tcacaagaga gagaacgatc gacgattctt ttatgggcat cgaacagaag
      121 cagtcatccc agccgctggt cgcgtttaat aatctaatat aataaattaa aattgatacc
      181 attgtcagca ttgaagattg taaagtgaaa aaactgaatt cgaagtaatt gtagataata
      241 aatagaccat ccatgaagtg caccttttag agttataatt ttcaaattgg tggaaaaacc
      301 ccagagcatc tttgctcatc tttgacaata taaattgtca caacattttg gtggcccatg
      361 aggggaccca tccaatcacg ccttctggaa taattatcta ctaatctgtt ttcgaattaa
      421 ttaatcagtt tggatctaaa ctttgtgaaa tctggcacat ggttataaat tttccattcg
      481 caactacata taaccagcaa acggcagcac atgtataagt gctgttacac tatcgtccca
      541 tacgctttac cctccaactg cgctgccctg ccgatccatc gctttgccga agtcaacgtg
      601 ggttaattta gatgctggag agaagctgtt tcgctgccga aatctatcac gtcgcatccc
      661 ccacaccttt tcgtcaaacc tggagcgact tcacttggac ttccagactt ttcgttcaat
      721 ttcgttacgt cacaacttga aaggggtaag tgtcgttgtg gtgtgttggt gagttgacaa
      781 agtattgagt acatttttca gtgtataaga gtaatacaat caaagctgaa acatggcagc
      841 agataaagac caggagcagg ggcaggcatc cagcgatgcc agcctatcaa acctacatat
      901 acttcaagct gatatttttg aacgtgttaa acaactttat caaaatttta aaaaggatag
      961 tcagtcaaga aaaactaaaa tctattttca aactcgtata aataaacttg aaaatttctc
     1021 aaaggaattc gacaccaatc atcaaactct tttattgaac ggttgctcac ctgaacatga
     1081 atattttacc tctcaactag cagcaaggtt tgaagagtct tacttaacat attattgcga
     1141 gattggagac gccttcgaga cccggtttcc aacagttccc agcgacgcta ctcctagcca
     1201 ttctaattca acgatgcaca acaccaccat gctacaagcg cctggctcta cagttcaact
     1261 accaaaatta ccagtaccta gttattctgg caagctgact gaatggccag cctttcatga
     1321 tgtctttcaa caacttattc acgataatgg tgcactttcc agcatacaaa aattccactt
     1381 tctgaagcaa gcactcccag cggaccgaga tcaagacgtg catcaaatgg acttgactga
     1441 agcgaattat ctcgtcgcct ggagtctcat tgttacgcgt tataataatc cccgattgtt
     1501 attcatgcat catatgaata ccctatatga gttgccatca atttccaaag aaagttcagc
     1561 cgaactaaaa catatgttaa acgttgccaa cgtttgcatc aatgagttca aacgcctcaa
     1621 cattgcaatt gccaattgcg atcattggat tgtgcatcat ctcaccacta agctgccatc
     1681 gcaaactatc caagcctggg aacacagtct tgggagtaca aaggaaatcc caaccttttt
     1741 cactttggaa tcatttctca acaaccgact ttttagcatc gatataattg aaggtcgcaa
     1801 ggttccacct ccaccacggc aaccacaagg agtcaacggc ttccaacgaa acgtcatcaa
     1861 acattcaggc aacgcacaaa ccaggatcag tagctgccat acttcagggg ttactaccaa
     1921 ctctgttcgc tgcgctcatt gcaatgacca acacatctta cgtcgttgtc cagacttttt
     1981 agcaaaggat tctttcgctc gcaaacttat tgttgaccgc agtaaggtat gtctcaattg
     2041 cctcagcccc acccattctc tgtcaaaatg taacagcagc aaaaactgtt tacaatgtgg
     2101 acaacgccat cacactctct tacatttccc aacccaggta aaggctagtg atgtcgcgca
     2161 gtctgcagga aacataacta gtctcaactc acagggtctg acagcatcta gcaacaccac
     2221 acagctcatc agcgcgtcag cctcacattc aacacctcat acgatgattc tcgcaactgc
     2281 tctggttcgt cttcatagta atgccacagg tcagtcagcg gtggtccgag cccttatcga
     2341 tcatggatca gaaggtaccc ttgttacgga aactgtagtc caagcgctag ggcttccccg
     2401 atttccagtc tcagcagaaa tatcaggggt aggagggaat tccaccaaca ggtgcaaata
     2461 tcgcaccgaa tgtactttaa gctcaactac taattcagga ttcaagatgt gggtggaaaa
     2521 tgccttcgtt ttgcgtaccc tgacttctcc tttaccaagg acgaatctaa ctctaccaac
     2581 gtgtccacat ttaactgggt tggagctcgc cgacccaaat tttatgcaca ctaatagcat
     2641 agatgtgctc ctcggcgtgg acaccattcc acaatttatg atgagtggaa tcaggagagg
     2701 atcttacgat caaccaattg cccaatgcac gcaacttggt tggatcattt ttggcagaat
     2761 tacgccaaaa cagacacaca cgatatccat acaatgtcat cattctaatc tggaaactct
     2821 agttcaaaaa ttcttcgaat tggaagcacg aaaattccaa aagaaaccag atctgtatga
     2881 acaatactca aaggtcatgg aggaatactt cgagctgcac caaataactg aagccatcac
     2941 ctcagaagaa cagcatcgcc tggcggacaa aggaggctca atcagttata ctgcatgcac
     3001 attaccccat catgcagttc tgaaggcgga cagcagcacc acaaaacttc gagttgtgta
     3061 cgacgcctca tgcaagacat caaatggaaa atcgctcaac gacattctct gtataggccc
     3121 agccttacaa aacgaccttg gtggggtcat tctcaattgg cgatttttac aatatgtctt
     3181 tgcggccgat attcagaaaa tgtatcgttg catcgatgta cacccggagg atacacactt
     3241 ccaacggatt atttggcaaa gggaaaacaa tgctataaag gattattgtt taacaactgt
     3301 gacgtttgga acagcatcag ccccgtacac agccattcgc atcatgcatc agatcgctca
     3361 ggatgaacga gatcaatttc cattagcaga acatgtttta cgaaaagaaa tatatgtgga
     3421 tgatttgcaa agtggacatg agacaattaa gggagccctt caagttcgag atgatgtcat
     3481 cggggcactt caatcagctg gtatggagct tcgaaaatgg gcagcaaatc atcccagtct
     3541 tttgaactct attcctcctg agcacatgtc caattccaaa attttggaaa tcgaaaacca
     3601 agagtccatt aaaactttgg ggctatattg gcaccccaag gaagactttt atggtttcaa
     3661 attaaaattt acaattgatg aaattttcac taaacgatca attcttgcta cagttgcacg
     3721 tctgtacgat cctttaggtt tcgttgctcc agtcataatc atcgccaagg ttattctcaa
     3781 agaagtctgg agcatacgta ttcaacaggc tgatggcact ccagcaggat tagcttggga
     3841 cgcaacggta ccgccagtaa ttcagcacaa gtggaaagaa tactgcacca atttacttaa
     3901 aattgaatca ctgagaatac cccgatggtt acagtattta cccagcacca tcgcatcctt
     3961 gcagctgcat atcttttgtg atggctcttc tatggcatac gcagcgtgtg cctatgtgcg
     4021 ggtccaacat acaaataact cggtatacac gcatctcata gctgcaaaga gtcgagtcac
     4081 acccacaaag ccgttgacaa ttcctagagt ggaactatgt ggagctgtac tcgccgcaca
     4141 actgggtgac tggctctgca agcaaataga tcaaccaacg catcccattt cgacctattt
     4201 ctggagcgac gcaacgatcg ttctttattg gattgcgggg gatcccttac attggaaaac
     4261 attcgtagcg aatcgtgtag gacgaatttt ggagtccagt tctgcatctc aatggagaca
     4321 tgtgcccacc ggagataacc ctgcagactg cgcgacgcgt ggtctctatc cagatcaatt
     4381 agctgcctat gatttatggt ggcaggggcc ttcttggcta cgactaccag aatctcaatg
     4441 gcctagcaaa atctttgaca ttcctgatag caccaatctc tcgtgtgagc aaaaatcgct
     4501 ttctctacaa acccacagct gcgttgagag aaatccaaac tctttactca cgtcgttttc
     4561 atcttacaac aaacttctgt ttataatggc ttacgtacga cgctttattc acaattcaca
     4621 aacgcgcgtg gactctcgac agagaggtcc agttaccgcc caggagtttc agcaggcact
     4681 agggcacatt gtccgactag tgcaacatga aacgtttaag gtggagattc aaaaaataaa
     4741 gacaaaaaca catttatcta gatcgaacaa attaagtcaa ctttccccat ttctagataa
     4801 cgaaggagtg ctgcgtgtcc gagggagatt gaaaaatgca ttgcacctat cgccgcatca
     4861 acgcacaccg atcattttgc caaaggatca tcattttacc gaacttgtca ttcgtaatgc
     4921 tcatctcaac acattacatg gcgggatatc acttacactg gcagtgacaa ggcaaacgtt
     4981 ttggattctt aatgggaaac aggcagttaa aaagattctg cacaaatgtg ttgactgctt
     5041 caagcacaga ccgaaggcag tcacgcagct catgggagac cttcccttac atcgagtgaa
     5101 cccaccaaag cgagcctttg aagccacagg cgtggactat accggtgcgc tagaaatcaa
     5161 agcgtcaaag tttcgtggac accacaaata caaggcatat attgcagttt ttatatgctt
     5221 ggcgacaaag gcagtccact tggaagctgt taccggattg tcttctcagg attttttgtg
     5281 ggctctacaa cgttttattg gcagacgtgg atactgccaa cacatctaca gcgattgcgg
     5341 taccaatttc attggagcag ataaatccct aaacctttgg catgaagagt ttcgacaaag
     5401 cgttatcgca acggttattc caaaattaac cgctcagcag attcaatggc atttcaatcc
     5461 gccacacagc ccaaacttcg gtggattatg ggaggcgaat gttaaagcgg ttaagacaca
     5521 cttacatcgc acgtgtaaag gggcgctcat gacctacgaa caactctcaa ctattttggt
     5581 tcaaatcgaa gcctgtttga actctcgccc actttgcccg ttgagctcgg atatggagga
     5641 tttagcagta ctgacaccgg cccatttctt aattggcgat tccatgatgg cgctacctaa
     5701 tccatcagct tcggataaat cgttaaacgc acaattcttg gaaggacaaa gactgcttcg
     5761 aaccttttgg catcgttgga gctcggattg gctttcacac ttacaatctc gtccaaaatg
     5821 gcagcgggtt gaggaaaact tgcgtttaca cgacatagtt attattaaag atgatcggct
     5881 tccgccaaat gaatggaagc tcggtcgcat agtcgaatta catccaggat ctgataatct
     5941 cattcgagtc gcatctatta agacggcatc cggaatttat aaacgctctt tgtcgaaaat
     6001 ctgtccattg ccattagcta cttattcaga ggctacggaa taaacattaa ttacgtacat
     6061 actttgtcca cctctacata tcgtaatgac acttatttct ttacagcaaa gtgcagaaat
     6121 ttggtttaaa tactggactc agtatttggg ggcggcatgt tcggacgttt gctgtagttg
     6181 agagaacata aacccaccac tctgttataa ccgagtttta tgtaaaggga gtcacaagag
     6241 agagaacgat cgacgattct tttatgggca tcgaacagaa gcagtcatcc cagccgctgg
     6301 tcgcgtttaa taatctaata taataaatta aaattgatac cattgtcagc attgaagatt
     6361 gtaaagtgaa aaaactgaat tcgaagtaat tgtagataat aaatagacca tccatgaagt
     6421 gcacctttta gagttataat tttcaaattg gtggaaaaac cccagagcat ctttgctcat
     6481 ct