PREDICTED: Drosophila obscura neurogenic protein mastermind


LOCUS       XM_022354798            4922 bp    mRNA    linear   INV 14-MAY-2021
            (LOC111066307), transcript variant X4, mRNA.
ACCESSION   XM_022354798
VERSION     XM_022354798.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022354798.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..4922
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..4922
                     /gene="LOC111066307"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 1 Protein, and 98% coverage of the
                     annotated genomic feature by RNAseq alignments, including
                     4 samples with support for all annotated introns"
                     /db_xref="GeneID:111066307"
     CDS             855..4844
                     /gene="LOC111066307"
                     /codon_start=1
                     /product="AF4/FMR2 family member lilli isoform X4"
                     /protein_id="XP_022210490.2"
                     /db_xref="GeneID:111066307"
                     /translation="MALSKRPLAKDTPLAESNSNNHNHSHSHSHSHSGGNSINNSSDL
                     ETTAIKRRKRCSRDEDATLNNNNNNSNSNNNNILPQKKRKQGPILDSPESPPPTSVHT
                     VGTVAAGIAKMTAPGGAADADQDDETLIRETQAALKSLSGSWPDARANLYRLQEQDEN
                     PPPFQNLFEEKQKYEAIAPRTPTTTATVSMFPRFHRQKENDQARLNAGATLEDRERGK
                     KLAPVTATGTALGGGPDDMDLEEAASNVYAQAASAFKPPIDFIKRNYAAAAHAHAHAQ
                     AQAHAHAHYTTSAYNASAATESAAGLAYYGYAAAAAASQQQQQQHQQHQQLSLEPTPL
                     PPRAAFDIASQLGEKPSKTSKEPLLGALPGTGTGHGGSQVDAKQYTILQPAGVGSRAA
                     SVMQDIAREGVVGVPLVATPPSTSSPPTAGGTAASTASATATLTSTSTPAPSYSPGSQ
                     NRADLEKHEKELHPLDKLKIASSHYLNNNNTSCINNNNNNNKLSATTMPIIKSEYSPV
                     ASIKSEYNKSPMHSYLANDAAGPGPGPASSVTASASTTPGTARTASGGGATNGGGGGG
                     GGGTTSSNGGDANLHAPHLNRFVGMQSPPHPQSHHSHAHHVQQQQQQQQQQQQHTLHQ
                     QRGPFINEGNDGPDPSASYHTEHQQQQQQQQQQQQQQQQAEERQYEQMRYAVGGELLS
                     SNGGANASELSPGTARSAYEAHPHPHPHPHPHPHPHPPTSLSSLSSASVGVGAPAFAT
                     VDSVSAVTVSTGAGGFERYDPNCCPNGQRQVASVAGVAAASASAAAAAAAYHYLPQSA
                     DDLQVQQQKYLQEQQLMLAKAEHEEQLANGGGAGPIYPRPMYHYDPTMGPLPPGFSAI
                     NLSVKMAAAQAAAAAAAYQNQQQQQQQQQQQHHQQQQQQQQQQQQQQQQQQQQQQQQQ
                     QQQHGKQSSSPTPNVGGVPAPAVDLSGSTSVTSSSPHGFNSPASHNQYNQRMGNGSPQ
                     PGASPNIASPQVPSPQGQTLDLSVTRLPHSIITSPQYGADGLVVGHAQGFGSGAPGGA
                     LGPNGPPRSPQMEPVDFSGPPRPLGFGLVGHISGPRPYSRESTPDSGGSHYIETYRDP
                     SGYSPHPGYGMVVQSDYPPAGYHGYGPAAYQCSNPYATAVGPGGYPTPVSGGYSPSPA
                     TCYSMPPPQHIPQHDKTKDGLTGCSRSDRNHLQSHSQELKCPTPGCDGSGHVTGNYSS
                     HRSLSGCPRANKPKSKPRDGQDSEPLRCPIPGCDGSGHSTGKFLSHRSASGCPIANRN
                     KMRVLEAGGTVEQHKAAVAAATAMKFDACTTVGGQGIKKPKFDEVTMVYPKGYTDYAT
                     FCIGAEYLL"
     misc_feature    <3621..4328
                     /gene="LOC111066307"
                     /note="large tegument protein UL36; Provisional; Region:
                     PHA03247"
                     /db_xref="CDD:223021"
     misc_feature    4410..4496
                     /gene="LOC111066307"
                     /note="Zinc finger, C2HC type; Region: zf-C2HC; pfam01530"
                     /db_xref="CDD:460240"
     misc_feature    4545..4631
                     /gene="LOC111066307"
                     /note="Zinc finger, C2HC type; Region: zf-C2HC; pfam01530"
                     /db_xref="CDD:460240"
ORIGIN      
        1 ttgctgctgc tgcgccgcac gctgctaaca ccgctgcttc tgtcagcgtc gacgccaact
       61 gagctggtcg tcgcgctgct gccgatgtaa aattttatta ccccaaaacg catccagcag
      121 tcgggttttg gacgtccgga ctacaccgcc gcctcgctga gacagacgac ttttattgca
      181 attctctcgc ccaagcggcg aaaaagcggc cccagaccca gaggccaacc tctttttaga
      241 gaaactaacg gacggagaca gcgatacgga gatacgcaga aacgtagaca cacgaagagc
      301 agcaaagaaa gcacggagaa cacaaaagaa accacggaga agcacggagg ccacagagac
      361 atttcaaact tttgcgcggc atcaaagtta cgacaaaaca acaaaaaaaa aaaacaaaaa
      421 acttttccaa actacgcgca aaactaaaat caactcttcc ggaggtcgtg ctgcttatag
      481 actagtagcc ccagccccag ccccttcttc cgatccacaa caccctcttc ccccacaccc
      541 cttagcaccc gattttgaaa cagtgcagtg caaacaataa ataagaaaca aaacgaacaa
      601 aaacaaaccg aaatatagtg gcaacaacaa ttgtcccaaa aagtggaaag ttcgcggcct
      661 aattgatatt gcgtatacgc ctccgatgcc gcaaaatttg tgcacgctcc atcggccgat
      721 ctaccaagaa gaactttaaa ctgttaaatc cctgaagacg tcgaagcggc gtgccgcagc
      781 cgaaccgttg aaaaattcat acaaatttga accaaccaaa cgaactggct tagagcagta
      841 gagccaccca caagatggcg ctgtccaagc ggccactcgc caaggatacg cctttggcag
      901 agagcaacag caacaaccac aaccacagcc acagtcacag ccacagccac agcggtggca
      961 acagcatcaa caacagcagt gatctggaga cgacagctat caagcgccgg aaacgttgca
     1021 gtcgcgatga ggatgcgaca ctcaacaaca acaacaacaa cagtaatagc aacaataaca
     1081 acatattgcc acaaaagaaa cgaaaacagg gccccatact ggatagcccc gagagtccac
     1141 ctccgacaag cgtccacact gtcggaacag tagccgccgg aatagccaag atgacagctc
     1201 cgggcggcgc cgccgatgct gatcaggatg atgagacact catacgggag acgcaggcgg
     1261 cattgaagag tctgtccggt agctggcccg atgcccgggc caatctgtac agattgcagg
     1321 agcaggacga gaatccaccg cccttccaga atctcttcga agagaaacaa aagtatgagg
     1381 ccattgcacc cagaactccc acaacaactg caactgtatc catgtttcca cgtttccaca
     1441 gacagaagga gaatgaccag gcccgcctca atgccggcgc cacgctcgag gatcgcgagc
     1501 ggggcaagaa gctggccccg gtcacagcaa ctggcacagc tctgggtggt ggaccagacg
     1561 acatggatct ggaggaggcc gccagcaatg tgtacgccca ggccgcctcg gccttcaagc
     1621 cgcccatcga cttcatcaaa cgcaactatg cggccgctgc ccacgcccac gcccatgccc
     1681 aggcccaggc ccatgcccat gctcactaca cgacaagcgc ctacaatgcg tccgcagcaa
     1741 cagagtccgc cgccggattg gcctactatg gctatgcggc agccgccgcc gccagtcaac
     1801 agcagcagca gcagcatcaa cagcatcagc aattgagcct ggagccgact ccattgccac
     1861 cacgggccgc ctttgacata gccagccagc tgggcgaaaa gccttcaaag accagcaagg
     1921 agccgctgtt gggagcattg ccaggaacgg gcacaggtca tggtgggtcc caggtggatg
     1981 ccaaacagta tacgatcctg cagccggcag gcgtgggcag tcgggcagcc tcagtgatgc
     2041 aggacattgc ccgggagggt gttgtcggtg tacctctggt tgccactcca ccatccacga
     2101 gtagtccgcc aacagcagga ggaacagcag catcgacagc atcagcgaca gcgacattga
     2161 catcgacatc gacgccggcg cctagctact cgccgggcag ccagaatcgc gcggatttgg
     2221 agaagcacga aaaggagctg catccattgg ataaactgaa gatcgcctcc agtcactatc
     2281 tgaacaacaa caataccagt tgcatcaaca acaataacaa taacaacaag ctgagtgcaa
     2341 caacaatgcc cattatcaaa tcggagtaca gtcctgtagc gagcatcaaa tcggagtaca
     2401 acaaaagccc aatgcactca tatctggcca acgatgcagc cggccccggg cccggccccg
     2461 cctccagtgt gacggccagc gcatccacaa caccgggcac cgctcgcacc gcatccggcg
     2521 gtggggcaac taacggtggt ggcggtggcg gtggcggtgg cacaacctcc tccaatggtg
     2581 gcgatgccaa tctgcatgcc ccgcacctga atcgctttgt gggcatgcag agtcctcccc
     2641 acccacagag ccaccactca cacgcccacc acgtacagca gcagcagcag cagcagcaac
     2701 agcagcagca acacacactc caccagcagc gcggaccctt tataaacgag ggcaacgacg
     2761 gtcccgatcc ttctgccagc taccacacgg agcaccagca acagcagcaa cagcagcaac
     2821 agcaacagca acagcagcag caggccgagg agcggcagta cgagcagatg cgctacgccg
     2881 tgggcggtga gctgctgagt agcaatgggg gagccaatgc cagcgaactg tcgcctggaa
     2941 cggcgaggag tgcctacgag gcgcatcccc atccgcatcc acacccacat ccgcatccac
     3001 atccgcaccc gcccacctcg ctcagctccc tcagcagcgc atcggtgggg gtgggggcgc
     3061 ccgcctttgc cacagttgac tccgtgtcgg cggtgaccgt ttcgactggg gccggcggct
     3121 tcgagcggta cgaccccaac tgctgtccca atggacagcg ccaggtggcg tctgtggcgg
     3181 gcgtggcagc tgcctcagca tcggcagcgg cggcggcggc agcctatcac tatctgccgc
     3241 aaagcgccga cgatctgcag gtgcagcagc aaaagtatct gcaggagcag cagcttatgt
     3301 tggccaaggc cgagcacgag gaacagttgg ccaatggcgg cggtgcgggg ccgatatatc
     3361 cacggcccat gtaccactac gatcccacca tgggccccct gccgccgggc ttctccgcca
     3421 tcaatctgtc cgtgaaaatg gccgctgccc aagcggccgc cgccgcagcc gcctatcaga
     3481 accagcagca gcagcaacaa cagcagcaac agcaacacca ccagcagcag cagcagcagc
     3541 aacagcagca acagcagcag cagcaacagc agcagcagca gcaacagcag caacagcaac
     3601 agcagcacgg caaacagagc tcctcgccca ccccgaatgt gggaggcgtg ccagcgccag
     3661 cggttgacct atccggatcc acatcggtga cctcctccag tccgcacggt ttcaattcac
     3721 cagcctccca caaccaatac aaccagcgca tgggcaacgg cagcccacag ccgggcgcca
     3781 gccccaatat agccagcccc caggtgccca gtccgcaggg acagaccctg gacctcagcg
     3841 tcaccagact cccacacagc atcatcacca gtccccagta tggggccgat ggccttgtcg
     3901 tgggccatgc ccagggattt ggcagcggag cgcccggcgg agctctgggc cccaacggac
     3961 cgccgcgctc cccacaaatg gagcccgtcg atttcagcgg cccgccgcga ccactaggct
     4021 tcggactggt cggacacatc agtggaccgc ggccctacag ccgtgaatcc acgccggaca
     4081 gcggcggttc acactacatc gagacgtaca gggatcccag cggatactcg ccacatcccg
     4141 gatacggcat ggtggtgcaa tcggactatc caccggctgg ctatcatggc tatggcccag
     4201 ccgcgtatca gtgcagcaat ccgtatgcga cggcggtagg acccggcggc tatccgacgc
     4261 ccgtctccgg cggctattca ccaagcccgg ccacctgcta ctcgatgcca ccgccgcagc
     4321 acataccgca gcacgacaag accaaggacg gattgacggg ctgctcgcgt tccgaccgga
     4381 atcatctgca atcgcactcg caggagctca agtgccccac gcccggctgc gatggctctg
     4441 gccatgtgac cggcaactac tcatcgcacc gcagcctctc cggatgtcca cgggccaata
     4501 aacccaaaag caagccgcgc gatggccagg actcggagcc gctcagatgt cccataccag
     4561 gatgcgatgg ctccggtcac tccaccggca agtttctctc ccacagaagt gcttcgggct
     4621 gtcccatagc aaatcggaac aagatgagag tcctggaggc tgggggcact gtggagcagc
     4681 acaaggccgc tgtggctgct gccacagcta tgaagttcga tgcctgcacc actgtgggtg
     4741 gccagggaat caagaagccc aaattcgatg aggtcaccat ggtctatccc aagggttata
     4801 cagattacgc aacattttgt atcggtgccg agtatctact gtagatagaa aatgaaactg
     4861 atcaaaaaca gtccgaaata tcgaaaacct gaaaccacaa ccaccaacca aaaataaatg
     4921 aa