PREDICTED: Drosophila obscura neurogenic protein mastermind


LOCUS       XM_022354797            5037 bp    mRNA    linear   INV 14-MAY-2021
DEFINITION  PREDICTED: Drosophila obscura neurogenic protein mastermind
            (LOC111066307), transcript variant X3, mRNA.
ACCESSION   XM_022354797
VERSION     XM_022354797.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022354797.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..5037
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..5037
                     /gene="LOC111066307"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 1 Protein, and 98% coverage of the
                     annotated genomic feature by RNAseq alignments, including
                     1 sample with support for all annotated introns"
                     /db_xref="GeneID:111066307"
     CDS             856..4959
                     /gene="LOC111066307"
                     /codon_start=1
                     /product="neurogenic protein mastermind isoform X3"
                     /protein_id="XP_022210489.2"
                     /db_xref="GeneID:111066307"
                     /translation="MALSKRPLAKDTPLAESNSNNHNHSHSHSHSHSGGNSINNSSDL
                     ETTAIKRRKRCSRDEDATLNNNNNNSNSNNNNILPQKKRKQGPILDSPESPPPTSVHT
                     VGTVAAGIAKMTAPGGAADADQDDETLIRETQAALKSLSGSWPDARANLYRLQEQDEN
                     PPPFQNLFEEKQKYEAIAPRTPTTTATVSMFPRFHRQKENDQARLNAGATLEDRERGK
                     KLAPVTATGTALGGGPDDMDLEEAASNVYAQAASAFKPPIDFIKRNYAAAAHAHAHAQ
                     AQAHAHAHYTTSAYNASAATESAAGLAYYGYAAAAAASQQQQQQHQQHQQLSLEPTPL
                     PPRAAFDIASQLGEKPSKTSKEPLLGALPGTGTGHGGSQVDAKQYTILQPAGVGSRAA
                     SVMQDIAREGVVGVPLVATPPSTSSPPTAGGTAASTASATATLTSTSTPAPSYSPGSQ
                     NRDGAKCPTPHCTGQGHVTGLYSHHRSLSGCPKRDKVTTESDLEKHEKELHPLDKLKI
                     ASSHYLNNNNTSCINNNNNNNKLSATTMPIIKSEYSPVASIKSEYNKSPMHSYLANDA
                     AGPGPGPASSVTASASTTPGTARTASGGGATNGGGGGGGGGTTSSNGGDANLHAPHLN
                     RFVGMQSPPHPQSHHSHAHHVQQQQQQQQQQQQHTLHQQRGPFINEGNDGPDPSASYH
                     TEHQQQQQQQQQQQQQQQQAEERQYEQMRYAVGGELLSSNGGANASELSPGTARSAYE
                     AHPHPHPHPHPHPHPHPPTSLSSLSSASVGVGAPAFATVDSVSAVTVSTGAGGFERYD
                     PNCCPNGQRQVASVAGVAAASASAAAAAAAYHYLPQSADDLQVQQQKYLQEQQLMLAK
                     AEHEEQLANGGGAGPIYPRPMYHYDPTMGPLPPGFSAINLSVKMAAAQAAAAAAAYQN
                     QQQQQQQQQQQHHQQQQQQQQQQQQQQQQQQQQQQQQQQQQHGKQSSSPTPNVGGVPA
                     PAVDLSGSTSVTSSSPHGFNSPASHNQYNQRMGNGSPQPGASPNIASPQVPSPQGQTL
                     DLSVTRLPHSIITSPQYGADGLVVGHAQGFGSGAPGGALGPNGPPRSPQMEPVDFSGP
                     PRPLGFGLVGHISGPRPYSRESTPDSGGSHYIETYRDPSGYSPHPGYGMVVQSDYPPA
                     GYHGYGPAAYQCSNPYATAVGPGGYPTPVSGGYSPSPATCYSMPPPQHIPQHDKTKDG
                     LTGCSRSDRNHLQSHSQELKCPTPGCDGSGHVTGNYSSHRSLSGCPRANKPKSKPRDG
                     QDSEPLRCPIPGCDGSGHSTGKFLSHRSASGCPIANRNKMRVLEAGGTVEQHKAAVAA
                     ATAMKFDACTTVGGQGIKKPKFDEVTMVYPKGYTDYATFCIGAEYLL"
     misc_feature    2221..2304
                     /gene="LOC111066307"
                     /note="Zinc finger, C2HC type; Region: zf-C2HC; pfam01530"
                     /db_xref="CDD:460240"
     misc_feature    <3736..4443
                     /gene="LOC111066307"
                     /note="large tegument protein UL36; Provisional; Region:
                     PHA03247"
                     /db_xref="CDD:223021"
     misc_feature    4525..4611
                     /gene="LOC111066307"
                     /note="Zinc finger, C2HC type; Region: zf-C2HC; pfam01530"
                     /db_xref="CDD:460240"
     misc_feature    4660..4746
                     /gene="LOC111066307"
                     /note="Zinc finger, C2HC type; Region: zf-C2HC; pfam01530"
                     /db_xref="CDD:460240"
ORIGIN      
        1 attgctgctg ctgcgccgca cgctgctaac accgctgctt ctgtcagcgt cgacgccaac
       61 tgagctggtc gtcgcgctgc tgccgatgta aaattttatt accccaaaac gcatccagca
      121 gtcgggtttt ggacgtccgg actacaccgc cgcctcgctg agacagacga cttttattgc
      181 aattctctcg cccaagcggc gaaaaagcgg ccccagaccc agaggccaac ctctttttag
      241 agaaactaac ggacggagac agcgatacgg agatacgcag aaacgtagac acacgaagag
      301 cagcaaagaa agcacggaga acacaaaaga aaccacggag aagcacggag gccacagaga
      361 catttcaaac ttttgcgcgg catcaaagtt acgacaaaac aacaaaaaaa aaaaacaaaa
      421 aacttttcca aactacgcgc aaaactaaaa tcaactcttc cggaggtcgt gctgcttata
      481 gactagtagc cccagcccca gccccttctt ccgatccaca acaccctctt cccccacacc
      541 ccttagcacc cgattttgaa acagtgcagt gcaaacaata aataagaaac aaaacgaaca
      601 aaaacaaacc gaaatatagt ggcaacaaca attgtcccaa aaagtggaaa gttcgcggcc
      661 taattgatat tgcgtatacg cctccgatgc cgcaaaattt gtgcacgctc catcggccga
      721 tctaccaaga agaactttaa actgttaaat ccctgaagac gtcgaagcgg cgtgccgcag
      781 ccgaaccgtt gaaaaattca tacaaatttg aaccaaccaa acgaactggc ttagagcagt
      841 agagccaccc acaagatggc gctgtccaag cggccactcg ccaaggatac gcctttggca
      901 gagagcaaca gcaacaacca caaccacagc cacagtcaca gccacagcca cagcggtggc
      961 aacagcatca acaacagcag tgatctggag acgacagcta tcaagcgccg gaaacgttgc
     1021 agtcgcgatg aggatgcgac actcaacaac aacaacaaca acagtaatag caacaataac
     1081 aacatattgc cacaaaagaa acgaaaacag ggccccatac tggatagccc cgagagtcca
     1141 cctccgacaa gcgtccacac tgtcggaaca gtagccgccg gaatagccaa gatgacagct
     1201 ccgggcggcg ccgccgatgc tgatcaggat gatgagacac tcatacggga gacgcaggcg
     1261 gcattgaaga gtctgtccgg tagctggccc gatgcccggg ccaatctgta cagattgcag
     1321 gagcaggacg agaatccacc gcccttccag aatctcttcg aagagaaaca aaagtatgag
     1381 gccattgcac ccagaactcc cacaacaact gcaactgtat ccatgtttcc acgtttccac
     1441 agacagaagg agaatgacca ggcccgcctc aatgccggcg ccacgctcga ggatcgcgag
     1501 cggggcaaga agctggcccc ggtcacagca actggcacag ctctgggtgg tggaccagac
     1561 gacatggatc tggaggaggc cgccagcaat gtgtacgccc aggccgcctc ggccttcaag
     1621 ccgcccatcg acttcatcaa acgcaactat gcggccgctg cccacgccca cgcccatgcc
     1681 caggcccagg cccatgccca tgctcactac acgacaagcg cctacaatgc gtccgcagca
     1741 acagagtccg ccgccggatt ggcctactat ggctatgcgg cagccgccgc cgccagtcaa
     1801 cagcagcagc agcagcatca acagcatcag caattgagcc tggagccgac tccattgcca
     1861 ccacgggccg cctttgacat agccagccag ctgggcgaaa agccttcaaa gaccagcaag
     1921 gagccgctgt tgggagcatt gccaggaacg ggcacaggtc atggtgggtc ccaggtggat
     1981 gccaaacagt atacgatcct gcagccggca ggcgtgggca gtcgggcagc ctcagtgatg
     2041 caggacattg cccgggaggg tgttgtcggt gtacctctgg ttgccactcc accatccacg
     2101 agtagtccgc caacagcagg aggaacagca gcatcgacag catcagcgac agcgacattg
     2161 acatcgacat cgacgccggc gcctagctac tcgccgggca gccagaatcg cgatggcgcc
     2221 aaatgcccca cgccgcattg cactggccaa ggacatgtca ccggattgta ttcgcatcat
     2281 cgcagtttat cgggttgtcc gaagcgcgat aaggttacca cagaatcgga tttggagaag
     2341 cacgaaaagg agctgcatcc attggataaa ctgaagatcg cctccagtca ctatctgaac
     2401 aacaacaata ccagttgcat caacaacaat aacaataaca acaagctgag tgcaacaaca
     2461 atgcccatta tcaaatcgga gtacagtcct gtagcgagca tcaaatcgga gtacaacaaa
     2521 agcccaatgc actcatatct ggccaacgat gcagccggcc ccgggcccgg ccccgcctcc
     2581 agtgtgacgg ccagcgcatc cacaacaccg ggcaccgctc gcaccgcatc cggcggtggg
     2641 gcaactaacg gtggtggcgg tggcggtggc ggtggcacaa cctcctccaa tggtggcgat
     2701 gccaatctgc atgccccgca cctgaatcgc tttgtgggca tgcagagtcc tccccaccca
     2761 cagagccacc actcacacgc ccaccacgta cagcagcagc agcagcagca gcaacagcag
     2821 cagcaacaca cactccacca gcagcgcgga ccctttataa acgagggcaa cgacggtccc
     2881 gatccttctg ccagctacca cacggagcac cagcaacagc agcaacagca gcaacagcaa
     2941 cagcaacagc agcagcaggc cgaggagcgg cagtacgagc agatgcgcta cgccgtgggc
     3001 ggtgagctgc tgagtagcaa tgggggagcc aatgccagcg aactgtcgcc tggaacggcg
     3061 aggagtgcct acgaggcgca tccccatccg catccacacc cacatccgca tccacatccg
     3121 cacccgccca cctcgctcag ctccctcagc agcgcatcgg tgggggtggg ggcgcccgcc
     3181 tttgccacag ttgactccgt gtcggcggtg accgtttcga ctggggccgg cggcttcgag
     3241 cggtacgacc ccaactgctg tcccaatgga cagcgccagg tggcgtctgt ggcgggcgtg
     3301 gcagctgcct cagcatcggc agcggcggcg gcggcagcct atcactatct gccgcaaagc
     3361 gccgacgatc tgcaggtgca gcagcaaaag tatctgcagg agcagcagct tatgttggcc
     3421 aaggccgagc acgaggaaca gttggccaat ggcggcggtg cggggccgat atatccacgg
     3481 cccatgtacc actacgatcc caccatgggc cccctgccgc cgggcttctc cgccatcaat
     3541 ctgtccgtga aaatggccgc tgcccaagcg gccgccgccg cagccgccta tcagaaccag
     3601 cagcagcagc aacaacagca gcaacagcaa caccaccagc agcagcagca gcagcaacag
     3661 cagcaacagc agcagcagca acagcagcag cagcagcaac agcagcaaca gcaacagcag
     3721 cacggcaaac agagctcctc gcccaccccg aatgtgggag gcgtgccagc gccagcggtt
     3781 gacctatccg gatccacatc ggtgacctcc tccagtccgc acggtttcaa ttcaccagcc
     3841 tcccacaacc aatacaacca gcgcatgggc aacggcagcc cacagccggg cgccagcccc
     3901 aatatagcca gcccccaggt gcccagtccg cagggacaga ccctggacct cagcgtcacc
     3961 agactcccac acagcatcat caccagtccc cagtatgggg ccgatggcct tgtcgtgggc
     4021 catgcccagg gatttggcag cggagcgccc ggcggagctc tgggccccaa cggaccgccg
     4081 cgctccccac aaatggagcc cgtcgatttc agcggcccgc cgcgaccact aggcttcgga
     4141 ctggtcggac acatcagtgg accgcggccc tacagccgtg aatccacgcc ggacagcggc
     4201 ggttcacact acatcgagac gtacagggat cccagcggat actcgccaca tcccggatac
     4261 ggcatggtgg tgcaatcgga ctatccaccg gctggctatc atggctatgg cccagccgcg
     4321 tatcagtgca gcaatccgta tgcgacggcg gtaggacccg gcggctatcc gacgcccgtc
     4381 tccggcggct attcaccaag cccggccacc tgctactcga tgccaccgcc gcagcacata
     4441 ccgcagcacg acaagaccaa ggacggattg acgggctgct cgcgttccga ccggaatcat
     4501 ctgcaatcgc actcgcagga gctcaagtgc cccacgcccg gctgcgatgg ctctggccat
     4561 gtgaccggca actactcatc gcaccgcagc ctctccggat gtccacgggc caataaaccc
     4621 aaaagcaagc cgcgcgatgg ccaggactcg gagccgctca gatgtcccat accaggatgc
     4681 gatggctccg gtcactccac cggcaagttt ctctcccaca gaagtgcttc gggctgtccc
     4741 atagcaaatc ggaacaagat gagagtcctg gaggctgggg gcactgtgga gcagcacaag
     4801 gccgctgtgg ctgctgccac agctatgaag ttcgatgcct gcaccactgt gggtggccag
     4861 ggaatcaaga agcccaaatt cgatgaggtc accatggtct atcccaaggg ttatacagat
     4921 tacgcaacat tttgtatcgg tgccgagtat ctactgtaga tagaaaatga aactgatcaa
     4981 aaacagtccg aaatatcgaa aacctgaaac cacaaccacc aaccaaaaat aaatgaa