PREDICTED: Drosophila obscura neurogenic protein mastermind


LOCUS       XM_022354800            6815 bp    mRNA    linear   INV 14-MAY-2021
            (LOC111066307), transcript variant X2, mRNA.
ACCESSION   XM_022354800
VERSION     XM_022354800.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022354800.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..6815
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..6815
                     /gene="LOC111066307"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 2 Proteins, and 99% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 4 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111066307"
     CDS             852..5957
                     /gene="LOC111066307"
                     /codon_start=1
                     /product="neurogenic protein mastermind isoform X2"
                     /protein_id="XP_022210492.2"
                     /db_xref="GeneID:111066307"
                     /translation="MALSKRPLAKDTPLAESNSNNHNHSHSHSHSHSGGNSINNSSDL
                     ETTAIKRRKRCSRDEDATLNNNNNNSNSNNNNILPQKKRKQGPILDSPESPPPTSVHT
                     VGTVAAGIAKMTAPGGAADADQDDETLIRETQAALKSLSGSWPDARANLYRLQEQDEN
                     PPPFQNLFEEKQKQKENDQARLNAGATLEDRERGKKLAPVTATGTALGGGPDDMDLEE
                     AASNVYAQAASAFKPPIDFIKRNYAAAAHAHAHAQAQAHAHAHYTTSAYNASAATESA
                     AGLAYYGYAAAAAASQQQQQQHQQHQQLSLEPTPLPPRAAFDIASQLGEKPSKTSKEP
                     LLGALPGTGTGHGGSQVDAKQYTILQPAGVGSRAASVMQDIAREGVVGVPLVATPPST
                     SSPPTAGGTAASTASATATLTSTSTPAPSYSPGSQNRADLEKHEKELHPLDKLKIASS
                     HYLNNNNTSCINNNNNNNKLSATTMPIIKSEYSPVASIKSEYNKSPMHSYLANDAAGP
                     GPGPASSVTASASTTPGTARTASGGGATNGGGGGGGGGTTSSNGGDANLHAPHLNRFV
                     GMQSPPHPQSHHSHAHHVQQQQQQQQQQQQHTLHQQRGPFINEGNDGPDPSASYHTEH
                     QQQQQQQQQQQQQQQQAEERQYEQMRYAVGGELLSSNGGANASELSPGTARSAYEAHP
                     HPHPHPHPHPHPHPPTSLSSLSSASVGVGAPAFATVDSVSAVTVSTGAGGFERYDPNC
                     CPNGQRQVASVAGVAAASASAAAAAAAYHYLPQSADDLQVQQQKYLQEQQLMLAKAEH
                     EEQLANGGGAGPIYPRPMYHYDPTMGPLPPGFSAINLSVKMAAAQAAAAAAAYQNQQQ
                     QQQQQQQQHHQQQQQQQQQQQQQQQQQQQQQQQQQQQQHGKQSSSPTPNVGGVPAPAV
                     DLSGSTSVTSSSPHGFNSPASHNQYNQRMGNGSPQPGASPNIASPQVPSPQGQTLDLS
                     VTRLPHSIITSPQYGADGLVVGHAQGFGSGAPGGALGPNGPPRSPQMEPVDFSGPPRP
                     LGFGLVGHISGPRPYSRESTPDSGGSHYIETYRDPSGYSPHPGYGMVVQSDYPPAGYH
                     GYGPAAYQCSNPYATAVGPGGYPTPVSGGYSPSPATCYSMPPPQHIPQHDKTKDGLTG
                     CSRSDRNHLQSHSQELKCPTPGCDGSGHVTGNYSSHRSLSGCPRANKPKSKPRDGQDS
                     EPLRCPIPGCDGSGHSTGKFLSHRSASGCPIANRNKMRVLEAGGTVEQHKAAVAAATA
                     MKFDACTTVGGQGIKKPKFDEVTMVYPKGYTGGSGLDIVMSGVGSTGVGVGGLGLNVN
                     VGLGVTSSSNNSAHSSLSSSNNSNGNGNGGNNEKSGGAAAASGNGSDDLNTLEAEISE
                     LQRENARVESQMMRLKSDINAMESQLSTSDREASPLSGHQQQQRSSNVAMASPSGQSP
                     FASVSSTSGTGTGAATSSSNNNGSNDLGHSISSLTPGTGHSNPNTNVGGMMSHAPVDG
                     SVAPPNANLNNYYESLRNNVITLLEHVRLPPPPAPPTSVSVSASIAGGQLVAGHGLDS
                     VCAGGQLIAGSGGDHATAYSTLLPPPPPPPSASSGNIGGGMYGHQGGTGTGGGPPPCP
                     PPVPPHHAYTVHHPVSYAHPHSHPHGHPHGHPHGHPHPHPHEHFDSYISKLQSLCVPP
                     DVYALPDDADRTVYNSVKPSMHQDYGKLMPTPI"
     misc_feature    <3549..4256
                     /gene="LOC111066307"
                     /note="large tegument protein UL36; Provisional; Region:
                     PHA03247"
                     /db_xref="CDD:223021"
     misc_feature    4338..4424
                     /gene="LOC111066307"
                     /note="Zinc finger, C2HC type; Region: zf-C2HC; pfam01530"
                     /db_xref="CDD:460240"
     misc_feature    4473..4559
                     /gene="LOC111066307"
                     /note="Zinc finger, C2HC type; Region: zf-C2HC; pfam01530"
                     /db_xref="CDD:460240"
ORIGIN      
        1 ctgctgctgc gccgcacgct gctaacaccg ctgcttctgt cagcgtcgac gccaactgag
       61 ctggtcgtcg cgctgctgcc gatgtaaaat tttattaccc caaaacgcat ccagcagtcg
      121 ggttttggac gtccggacta caccgccgcc tcgctgagac agacgacttt tattgcaatt
      181 ctctcgccca agcggcgaaa aagcggcccc agacccagag gccaacctct ttttagagaa
      241 actaacggac ggagacagcg atacggagat acgcagaaac gtagacacac gaagagcagc
      301 aaagaaagca cggagaacac aaaagaaacc acggagaagc acggaggcca cagagacatt
      361 tcaaactttt gcgcggcatc aaagttacga caaaacaaca aaaaaaaaaa acaaaaaact
      421 tttccaaact acgcgcaaaa ctaaaatcaa ctcttccgga ggtcgtgctg cttatagact
      481 agtagcccca gccccagccc cttcttccga tccacaacac cctcttcccc cacacccctt
      541 agcacccgat tttgaaacag tgcagtgcaa acaataaata agaaacaaaa cgaacaaaaa
      601 caaaccgaaa tatagtggca acaacaattg tcccaaaaag tggaaagttc gcggcctaat
      661 tgatattgcg tatacgcctc cgatgccgca aaatttgtgc acgctccatc ggccgatcta
      721 ccaagaagaa ctttaaactg ttaaatccct gaagacgtcg aagcggcgtg ccgcagccga
      781 accgttgaaa aattcataca aatttgaacc aaccaaacga actggcttag agcagtagag
      841 ccacccacaa gatggcgctg tccaagcggc cactcgccaa ggatacgcct ttggcagaga
      901 gcaacagcaa caaccacaac cacagccaca gtcacagcca cagccacagc ggtggcaaca
      961 gcatcaacaa cagcagtgat ctggagacga cagctatcaa gcgccggaaa cgttgcagtc
     1021 gcgatgagga tgcgacactc aacaacaaca acaacaacag taatagcaac aataacaaca
     1081 tattgccaca aaagaaacga aaacagggcc ccatactgga tagccccgag agtccacctc
     1141 cgacaagcgt ccacactgtc ggaacagtag ccgccggaat agccaagatg acagctccgg
     1201 gcggcgccgc cgatgctgat caggatgatg agacactcat acgggagacg caggcggcat
     1261 tgaagagtct gtccggtagc tggcccgatg cccgggccaa tctgtacaga ttgcaggagc
     1321 aggacgagaa tccaccgccc ttccagaatc tcttcgaaga gaaacaaaaa cagaaggaga
     1381 atgaccaggc ccgcctcaat gccggcgcca cgctcgagga tcgcgagcgg ggcaagaagc
     1441 tggccccggt cacagcaact ggcacagctc tgggtggtgg accagacgac atggatctgg
     1501 aggaggccgc cagcaatgtg tacgcccagg ccgcctcggc cttcaagccg cccatcgact
     1561 tcatcaaacg caactatgcg gccgctgccc acgcccacgc ccatgcccag gcccaggccc
     1621 atgcccatgc tcactacacg acaagcgcct acaatgcgtc cgcagcaaca gagtccgccg
     1681 ccggattggc ctactatggc tatgcggcag ccgccgccgc cagtcaacag cagcagcagc
     1741 agcatcaaca gcatcagcaa ttgagcctgg agccgactcc attgccacca cgggccgcct
     1801 ttgacatagc cagccagctg ggcgaaaagc cttcaaagac cagcaaggag ccgctgttgg
     1861 gagcattgcc aggaacgggc acaggtcatg gtgggtccca ggtggatgcc aaacagtata
     1921 cgatcctgca gccggcaggc gtgggcagtc gggcagcctc agtgatgcag gacattgccc
     1981 gggagggtgt tgtcggtgta cctctggttg ccactccacc atccacgagt agtccgccaa
     2041 cagcaggagg aacagcagca tcgacagcat cagcgacagc gacattgaca tcgacatcga
     2101 cgccggcgcc tagctactcg ccgggcagcc agaatcgcgc ggatttggag aagcacgaaa
     2161 aggagctgca tccattggat aaactgaaga tcgcctccag tcactatctg aacaacaaca
     2221 ataccagttg catcaacaac aataacaata acaacaagct gagtgcaaca acaatgccca
     2281 ttatcaaatc ggagtacagt cctgtagcga gcatcaaatc ggagtacaac aaaagcccaa
     2341 tgcactcata tctggccaac gatgcagccg gccccgggcc cggccccgcc tccagtgtga
     2401 cggccagcgc atccacaaca ccgggcaccg ctcgcaccgc atccggcggt ggggcaacta
     2461 acggtggtgg cggtggcggt ggcggtggca caacctcctc caatggtggc gatgccaatc
     2521 tgcatgcccc gcacctgaat cgctttgtgg gcatgcagag tcctccccac ccacagagcc
     2581 accactcaca cgcccaccac gtacagcagc agcagcagca gcagcaacag cagcagcaac
     2641 acacactcca ccagcagcgc ggacccttta taaacgaggg caacgacggt cccgatcctt
     2701 ctgccagcta ccacacggag caccagcaac agcagcaaca gcagcaacag caacagcaac
     2761 agcagcagca ggccgaggag cggcagtacg agcagatgcg ctacgccgtg ggcggtgagc
     2821 tgctgagtag caatggggga gccaatgcca gcgaactgtc gcctggaacg gcgaggagtg
     2881 cctacgaggc gcatccccat ccgcatccac acccacatcc gcatccacat ccgcacccgc
     2941 ccacctcgct cagctccctc agcagcgcat cggtgggggt gggggcgccc gcctttgcca
     3001 cagttgactc cgtgtcggcg gtgaccgttt cgactggggc cggcggcttc gagcggtacg
     3061 accccaactg ctgtcccaat ggacagcgcc aggtggcgtc tgtggcgggc gtggcagctg
     3121 cctcagcatc ggcagcggcg gcggcggcag cctatcacta tctgccgcaa agcgccgacg
     3181 atctgcaggt gcagcagcaa aagtatctgc aggagcagca gcttatgttg gccaaggccg
     3241 agcacgagga acagttggcc aatggcggcg gtgcggggcc gatatatcca cggcccatgt
     3301 accactacga tcccaccatg ggccccctgc cgccgggctt ctccgccatc aatctgtccg
     3361 tgaaaatggc cgctgcccaa gcggccgccg ccgcagccgc ctatcagaac cagcagcagc
     3421 agcaacaaca gcagcaacag caacaccacc agcagcagca gcagcagcaa cagcagcaac
     3481 agcagcagca gcaacagcag cagcagcagc aacagcagca acagcaacag cagcacggca
     3541 aacagagctc ctcgcccacc ccgaatgtgg gaggcgtgcc agcgccagcg gttgacctat
     3601 ccggatccac atcggtgacc tcctccagtc cgcacggttt caattcacca gcctcccaca
     3661 accaatacaa ccagcgcatg ggcaacggca gcccacagcc gggcgccagc cccaatatag
     3721 ccagccccca ggtgcccagt ccgcagggac agaccctgga cctcagcgtc accagactcc
     3781 cacacagcat catcaccagt ccccagtatg gggccgatgg ccttgtcgtg ggccatgccc
     3841 agggatttgg cagcggagcg cccggcggag ctctgggccc caacggaccg ccgcgctccc
     3901 cacaaatgga gcccgtcgat ttcagcggcc cgccgcgacc actaggcttc ggactggtcg
     3961 gacacatcag tggaccgcgg ccctacagcc gtgaatccac gccggacagc ggcggttcac
     4021 actacatcga gacgtacagg gatcccagcg gatactcgcc acatcccgga tacggcatgg
     4081 tggtgcaatc ggactatcca ccggctggct atcatggcta tggcccagcc gcgtatcagt
     4141 gcagcaatcc gtatgcgacg gcggtaggac ccggcggcta tccgacgccc gtctccggcg
     4201 gctattcacc aagcccggcc acctgctact cgatgccacc gccgcagcac ataccgcagc
     4261 acgacaagac caaggacgga ttgacgggct gctcgcgttc cgaccggaat catctgcaat
     4321 cgcactcgca ggagctcaag tgccccacgc ccggctgcga tggctctggc catgtgaccg
     4381 gcaactactc atcgcaccgc agcctctccg gatgtccacg ggccaataaa cccaaaagca
     4441 agccgcgcga tggccaggac tcggagccgc tcagatgtcc cataccagga tgcgatggct
     4501 ccggtcactc caccggcaag tttctctccc acagaagtgc ttcgggctgt cccatagcaa
     4561 atcggaacaa gatgagagtc ctggaggctg ggggcactgt ggagcagcac aaggccgctg
     4621 tggctgctgc cacagctatg aagttcgatg cctgcaccac tgtgggtggc cagggaatca
     4681 agaagcccaa attcgatgag gtcaccatgg tctatcccaa gggttataca ggaggaagcg
     4741 gcctggacat tgtcatgagc ggcgtgggca gcactggggt cggcgttgga ggccttggac
     4801 tcaacgttaa tgttggcctt ggagtcacca gcagcagcaa caacagtgcc cacagcagtc
     4861 tcagcagcag caacaacagc aacggcaacg gcaacggtgg caacaacgag aagagcggag
     4921 gagcggcggc agcatccggc aatggtagcg acgatctaaa caccctggag gcggagatct
     4981 ccgagctgca gcgggagaac gcccgtgtcg aatcgcagat gatgcgactc aagtccgaca
     5041 tcaatgcgat ggagtcgcag ctgagcacca gcgatcggga ggcttctcca ttgagcggcc
     5101 atcagcaaca gcagcgctcc tccaatgtgg ccatggcttc gcccagcggt caatcgccct
     5161 tcgccagcgt tagctccacc agcggtaccg gcacaggtgc cgcaaccagc tccagcaaca
     5221 acaacggaag caacgatctg ggccactcga tcagcagtct gacgccaggc accggccaca
     5281 gcaacccaaa cacgaatgtc ggtggcatga tgtcgcatgc accggtggac gggagcgtgg
     5341 ccccgcccaa tgccaatcta aacaactact acgagagttt gcgcaacaac gtgatcacgc
     5401 tgctggagca tgtgcgcctg ccaccgccac cggcaccgcc cacttcggtc tctgtctcgg
     5461 cctcgatcgc cggcggtcag ttggtggcgg gccatggcct ggacagtgtg tgcgccgggg
     5521 gtcaactgat agccggcagc ggcggagatc acgccacggc ctactccaca ttgctgccgc
     5581 cgccgccacc gccgccatcg gccagcagcg gtaatattgg tggcggaatg tacggtcatc
     5641 agggtgggac gggtactggt ggtggcccgc caccgtgtcc accgccggtg ccgccgcatc
     5701 atgcctatac cgtgcatcat cccgtcagct atgcccaccc acactcgcat ccgcacggac
     5761 atccgcacgg ccatccgcac ggtcacccgc acccgcatcc gcacgagcac ttcgactctt
     5821 acatctccaa gctgcagtcg ctctgcgttc cgcccgatgt ctatgccctg cccgatgacg
     5881 ccgatcggac cgtctacaat tcggtgaagc caagcatgca ccaggactac ggcaaactga
     5941 tgccgacacc catctaaacg aggaggatat caaactaaca gccggtatcc agccgatgtt
     6001 ccatcccgtc cagggttcgt gagtgtgtat atatactacc caaagagtgg agaaaacaga
     6061 ctatatgtaa gaattgtggt gtggggtatt gggtacagat gctttaacct gacgaacgag
     6121 gcatctcccg agcccaagga tctttataca tatagcgcat ggatatctgt agagatctac
     6181 gtatatagcg cgtgctcctg gaaaacggac agatcctttt cctagtgtta gattgagctg
     6241 ttgcacatcc tatatcctag acgctttcgt cgtgttgata gaaactgtat aaagtattga
     6301 aacctaatga aaaaaaaaaa caaaaataat aagtgtgtaa taatattaat tcataatacg
     6361 atttacgatt aacaaatttt ttttttgtct gtatcaaata ctaaaagaaa actagaagtt
     6421 atagaagcat acataaatat agaagtagga gtttaacaac gtacatatat gttaattgta
     6481 gggcatttgt ttggtgttga tgtcttggtc aattttttgc atacaaaatg gataatgttc
     6541 ttaaatgttt aatcaacccc tccacccaca cacacacacg caaaaacccc accccacccc
     6601 agccctaaac cccaaagacc gagttctagt ccctcaaagt aagtttagtt tagagaaaaa
     6661 gtcaaacacc aaaatgtgga gataaaatga tataataaaa aacataaacg agaaaatata
     6721 ttcaatacta aagtatagag gatgtaatcg tgttacaatt tttttttttt tttgtaatat
     6781 tgaatatgaa agggcaaatg tgtgtgtaat atcaa