PREDICTED: Drosophila obscura neurogenic protein mastermind


LOCUS       XM_022354796            6885 bp    mRNA    linear   INV 14-MAY-2021
            (LOC111066307), transcript variant X1, mRNA.
ACCESSION   XM_022354796
VERSION     XM_022354796.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022354796.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..6885
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..6885
                     /gene="LOC111066307"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 1 Protein, and 99% coverage of the
                     annotated genomic feature by RNAseq alignments, including
                     4 samples with support for all annotated introns"
                     /db_xref="GeneID:111066307"
     CDS             853..6027
                     /gene="LOC111066307"
                     /codon_start=1
                     /product="neurogenic protein mastermind isoform X1"
                     /protein_id="XP_022210488.2"
                     /db_xref="GeneID:111066307"
                     /translation="MALSKRPLAKDTPLAESNSNNHNHSHSHSHSHSGGNSINNSSDL
                     ETTAIKRRKRCSRDEDATLNNNNNNSNSNNNNILPQKKRKQGPILDSPESPPPTSVHT
                     VGTVAAGIAKMTAPGGAADADQDDETLIRETQAALKSLSGSWPDARANLYRLQEQDEN
                     PPPFQNLFEEKQKYEAIAPRTPTTTATVSMFPRFHRQKENDQARLNAGATLEDRERGK
                     KLAPVTATGTALGGGPDDMDLEEAASNVYAQAASAFKPPIDFIKRNYAAAAHAHAHAQ
                     AQAHAHAHYTTSAYNASAATESAAGLAYYGYAAAAAASQQQQQQHQQHQQLSLEPTPL
                     PPRAAFDIASQLGEKPSKTSKEPLLGALPGTGTGHGGSQVDAKQYTILQPAGVGSRAA
                     SVMQDIAREGVVGVPLVATPPSTSSPPTAGGTAASTASATATLTSTSTPAPSYSPGSQ
                     NRADLEKHEKELHPLDKLKIASSHYLNNNNTSCINNNNNNNKLSATTMPIIKSEYSPV
                     ASIKSEYNKSPMHSYLANDAAGPGPGPASSVTASASTTPGTARTASGGGATNGGGGGG
                     GGGTTSSNGGDANLHAPHLNRFVGMQSPPHPQSHHSHAHHVQQQQQQQQQQQQHTLHQ
                     QRGPFINEGNDGPDPSASYHTEHQQQQQQQQQQQQQQQQAEERQYEQMRYAVGGELLS
                     SNGGANASELSPGTARSAYEAHPHPHPHPHPHPHPHPPTSLSSLSSASVGVGAPAFAT
                     VDSVSAVTVSTGAGGFERYDPNCCPNGQRQVASVAGVAAASASAAAAAAAYHYLPQSA
                     DDLQVQQQKYLQEQQLMLAKAEHEEQLANGGGAGPIYPRPMYHYDPTMGPLPPGFSAI
                     NLSVKMAAAQAAAAAAAYQNQQQQQQQQQQQHHQQQQQQQQQQQQQQQQQQQQQQQQQ
                     QQQHGKQSSSPTPNVGGVPAPAVDLSGSTSVTSSSPHGFNSPASHNQYNQRMGNGSPQ
                     PGASPNIASPQVPSPQGQTLDLSVTRLPHSIITSPQYGADGLVVGHAQGFGSGAPGGA
                     LGPNGPPRSPQMEPVDFSGPPRPLGFGLVGHISGPRPYSRESTPDSGGSHYIETYRDP
                     SGYSPHPGYGMVVQSDYPPAGYHGYGPAAYQCSNPYATAVGPGGYPTPVSGGYSPSPA
                     TCYSMPPPQHIPQHDKTKDGLTGCSRSDRNHLQSHSQELKCPTPGCDGSGHVTGNYSS
                     HRSLSGCPRANKPKSKPRDGQDSEPLRCPIPGCDGSGHSTGKFLSHRSASGCPIANRN
                     KMRVLEAGGTVEQHKAAVAAATAMKFDACTTVGGQGIKKPKFDEVTMVYPKGYTGGSG
                     LDIVMSGVGSTGVGVGGLGLNVNVGLGVTSSSNNSAHSSLSSSNNSNGNGNGGNNEKS
                     GGAAAASGNGSDDLNTLEAEISELQRENARVESQMMRLKSDINAMESQLSTSDREASP
                     LSGHQQQQRSSNVAMASPSGQSPFASVSSTSGTGTGAATSSSNNNGSNDLGHSISSLT
                     PGTGHSNPNTNVGGMMSHAPVDGSVAPPNANLNNYYESLRNNVITLLEHVRLPPPPAP
                     PTSVSVSASIAGGQLVAGHGLDSVCAGGQLIAGSGGDHATAYSTLLPPPPPPPSASSG
                     NIGGGMYGHQGGTGTGGGPPPCPPPVPPHHAYTVHHPVSYAHPHSHPHGHPHGHPHGH
                     PHPHPHEHFDSYISKLQSLCVPPDVYALPDDADRTVYNSVKPSMHQDYGKLMPTPI"
     misc_feature    <3619..4326
                     /gene="LOC111066307"
                     /note="large tegument protein UL36; Provisional; Region:
                     PHA03247"
                     /db_xref="CDD:223021"
     misc_feature    4408..4494
                     /gene="LOC111066307"
                     /note="Zinc finger, C2HC type; Region: zf-C2HC; pfam01530"
                     /db_xref="CDD:460240"
     misc_feature    4543..4629
                     /gene="LOC111066307"
                     /note="Zinc finger, C2HC type; Region: zf-C2HC; pfam01530"
                     /db_xref="CDD:460240"
ORIGIN      
        1 gctgctgctg cgccgcacgc tgctaacacc gctgcttctg tcagcgtcga cgccaactga
       61 gctggtcgtc gcgctgctgc cgatgtaaaa ttttattacc ccaaaacgca tccagcagtc
      121 gggttttgga cgtccggact acaccgccgc ctcgctgaga cagacgactt ttattgcaat
      181 tctctcgccc aagcggcgaa aaagcggccc cagacccaga ggccaacctc tttttagaga
      241 aactaacgga cggagacagc gatacggaga tacgcagaaa cgtagacaca cgaagagcag
      301 caaagaaagc acggagaaca caaaagaaac cacggagaag cacggaggcc acagagacat
      361 ttcaaacttt tgcgcggcat caaagttacg acaaaacaac aaaaaaaaaa aacaaaaaac
      421 ttttccaaac tacgcgcaaa actaaaatca actcttccgg aggtcgtgct gcttatagac
      481 tagtagcccc agccccagcc ccttcttccg atccacaaca ccctcttccc ccacacccct
      541 tagcacccga ttttgaaaca gtgcagtgca aacaataaat aagaaacaaa acgaacaaaa
      601 acaaaccgaa atatagtggc aacaacaatt gtcccaaaaa gtggaaagtt cgcggcctaa
      661 ttgatattgc gtatacgcct ccgatgccgc aaaatttgtg cacgctccat cggccgatct
      721 accaagaaga actttaaact gttaaatccc tgaagacgtc gaagcggcgt gccgcagccg
      781 aaccgttgaa aaattcatac aaatttgaac caaccaaacg aactggctta gagcagtaga
      841 gccacccaca agatggcgct gtccaagcgg ccactcgcca aggatacgcc tttggcagag
      901 agcaacagca acaaccacaa ccacagccac agtcacagcc acagccacag cggtggcaac
      961 agcatcaaca acagcagtga tctggagacg acagctatca agcgccggaa acgttgcagt
     1021 cgcgatgagg atgcgacact caacaacaac aacaacaaca gtaatagcaa caataacaac
     1081 atattgccac aaaagaaacg aaaacagggc cccatactgg atagccccga gagtccacct
     1141 ccgacaagcg tccacactgt cggaacagta gccgccggaa tagccaagat gacagctccg
     1201 ggcggcgccg ccgatgctga tcaggatgat gagacactca tacgggagac gcaggcggca
     1261 ttgaagagtc tgtccggtag ctggcccgat gcccgggcca atctgtacag attgcaggag
     1321 caggacgaga atccaccgcc cttccagaat ctcttcgaag agaaacaaaa gtatgaggcc
     1381 attgcaccca gaactcccac aacaactgca actgtatcca tgtttccacg tttccacaga
     1441 cagaaggaga atgaccaggc ccgcctcaat gccggcgcca cgctcgagga tcgcgagcgg
     1501 ggcaagaagc tggccccggt cacagcaact ggcacagctc tgggtggtgg accagacgac
     1561 atggatctgg aggaggccgc cagcaatgtg tacgcccagg ccgcctcggc cttcaagccg
     1621 cccatcgact tcatcaaacg caactatgcg gccgctgccc acgcccacgc ccatgcccag
     1681 gcccaggccc atgcccatgc tcactacacg acaagcgcct acaatgcgtc cgcagcaaca
     1741 gagtccgccg ccggattggc ctactatggc tatgcggcag ccgccgccgc cagtcaacag
     1801 cagcagcagc agcatcaaca gcatcagcaa ttgagcctgg agccgactcc attgccacca
     1861 cgggccgcct ttgacatagc cagccagctg ggcgaaaagc cttcaaagac cagcaaggag
     1921 ccgctgttgg gagcattgcc aggaacgggc acaggtcatg gtgggtccca ggtggatgcc
     1981 aaacagtata cgatcctgca gccggcaggc gtgggcagtc gggcagcctc agtgatgcag
     2041 gacattgccc gggagggtgt tgtcggtgta cctctggttg ccactccacc atccacgagt
     2101 agtccgccaa cagcaggagg aacagcagca tcgacagcat cagcgacagc gacattgaca
     2161 tcgacatcga cgccggcgcc tagctactcg ccgggcagcc agaatcgcgc ggatttggag
     2221 aagcacgaaa aggagctgca tccattggat aaactgaaga tcgcctccag tcactatctg
     2281 aacaacaaca ataccagttg catcaacaac aataacaata acaacaagct gagtgcaaca
     2341 acaatgccca ttatcaaatc ggagtacagt cctgtagcga gcatcaaatc ggagtacaac
     2401 aaaagcccaa tgcactcata tctggccaac gatgcagccg gccccgggcc cggccccgcc
     2461 tccagtgtga cggccagcgc atccacaaca ccgggcaccg ctcgcaccgc atccggcggt
     2521 ggggcaacta acggtggtgg cggtggcggt ggcggtggca caacctcctc caatggtggc
     2581 gatgccaatc tgcatgcccc gcacctgaat cgctttgtgg gcatgcagag tcctccccac
     2641 ccacagagcc accactcaca cgcccaccac gtacagcagc agcagcagca gcagcaacag
     2701 cagcagcaac acacactcca ccagcagcgc ggacccttta taaacgaggg caacgacggt
     2761 cccgatcctt ctgccagcta ccacacggag caccagcaac agcagcaaca gcagcaacag
     2821 caacagcaac agcagcagca ggccgaggag cggcagtacg agcagatgcg ctacgccgtg
     2881 ggcggtgagc tgctgagtag caatggggga gccaatgcca gcgaactgtc gcctggaacg
     2941 gcgaggagtg cctacgaggc gcatccccat ccgcatccac acccacatcc gcatccacat
     3001 ccgcacccgc ccacctcgct cagctccctc agcagcgcat cggtgggggt gggggcgccc
     3061 gcctttgcca cagttgactc cgtgtcggcg gtgaccgttt cgactggggc cggcggcttc
     3121 gagcggtacg accccaactg ctgtcccaat ggacagcgcc aggtggcgtc tgtggcgggc
     3181 gtggcagctg cctcagcatc ggcagcggcg gcggcggcag cctatcacta tctgccgcaa
     3241 agcgccgacg atctgcaggt gcagcagcaa aagtatctgc aggagcagca gcttatgttg
     3301 gccaaggccg agcacgagga acagttggcc aatggcggcg gtgcggggcc gatatatcca
     3361 cggcccatgt accactacga tcccaccatg ggccccctgc cgccgggctt ctccgccatc
     3421 aatctgtccg tgaaaatggc cgctgcccaa gcggccgccg ccgcagccgc ctatcagaac
     3481 cagcagcagc agcaacaaca gcagcaacag caacaccacc agcagcagca gcagcagcaa
     3541 cagcagcaac agcagcagca gcaacagcag cagcagcagc aacagcagca acagcaacag
     3601 cagcacggca aacagagctc ctcgcccacc ccgaatgtgg gaggcgtgcc agcgccagcg
     3661 gttgacctat ccggatccac atcggtgacc tcctccagtc cgcacggttt caattcacca
     3721 gcctcccaca accaatacaa ccagcgcatg ggcaacggca gcccacagcc gggcgccagc
     3781 cccaatatag ccagccccca ggtgcccagt ccgcagggac agaccctgga cctcagcgtc
     3841 accagactcc cacacagcat catcaccagt ccccagtatg gggccgatgg ccttgtcgtg
     3901 ggccatgccc agggatttgg cagcggagcg cccggcggag ctctgggccc caacggaccg
     3961 ccgcgctccc cacaaatgga gcccgtcgat ttcagcggcc cgccgcgacc actaggcttc
     4021 ggactggtcg gacacatcag tggaccgcgg ccctacagcc gtgaatccac gccggacagc
     4081 ggcggttcac actacatcga gacgtacagg gatcccagcg gatactcgcc acatcccgga
     4141 tacggcatgg tggtgcaatc ggactatcca ccggctggct atcatggcta tggcccagcc
     4201 gcgtatcagt gcagcaatcc gtatgcgacg gcggtaggac ccggcggcta tccgacgccc
     4261 gtctccggcg gctattcacc aagcccggcc acctgctact cgatgccacc gccgcagcac
     4321 ataccgcagc acgacaagac caaggacgga ttgacgggct gctcgcgttc cgaccggaat
     4381 catctgcaat cgcactcgca ggagctcaag tgccccacgc ccggctgcga tggctctggc
     4441 catgtgaccg gcaactactc atcgcaccgc agcctctccg gatgtccacg ggccaataaa
     4501 cccaaaagca agccgcgcga tggccaggac tcggagccgc tcagatgtcc cataccagga
     4561 tgcgatggct ccggtcactc caccggcaag tttctctccc acagaagtgc ttcgggctgt
     4621 cccatagcaa atcggaacaa gatgagagtc ctggaggctg ggggcactgt ggagcagcac
     4681 aaggccgctg tggctgctgc cacagctatg aagttcgatg cctgcaccac tgtgggtggc
     4741 cagggaatca agaagcccaa attcgatgag gtcaccatgg tctatcccaa gggttataca
     4801 ggaggaagcg gcctggacat tgtcatgagc ggcgtgggca gcactggggt cggcgttgga
     4861 ggccttggac tcaacgttaa tgttggcctt ggagtcacca gcagcagcaa caacagtgcc
     4921 cacagcagtc tcagcagcag caacaacagc aacggcaacg gcaacggtgg caacaacgag
     4981 aagagcggag gagcggcggc agcatccggc aatggtagcg acgatctaaa caccctggag
     5041 gcggagatct ccgagctgca gcgggagaac gcccgtgtcg aatcgcagat gatgcgactc
     5101 aagtccgaca tcaatgcgat ggagtcgcag ctgagcacca gcgatcggga ggcttctcca
     5161 ttgagcggcc atcagcaaca gcagcgctcc tccaatgtgg ccatggcttc gcccagcggt
     5221 caatcgccct tcgccagcgt tagctccacc agcggtaccg gcacaggtgc cgcaaccagc
     5281 tccagcaaca acaacggaag caacgatctg ggccactcga tcagcagtct gacgccaggc
     5341 accggccaca gcaacccaaa cacgaatgtc ggtggcatga tgtcgcatgc accggtggac
     5401 gggagcgtgg ccccgcccaa tgccaatcta aacaactact acgagagttt gcgcaacaac
     5461 gtgatcacgc tgctggagca tgtgcgcctg ccaccgccac cggcaccgcc cacttcggtc
     5521 tctgtctcgg cctcgatcgc cggcggtcag ttggtggcgg gccatggcct ggacagtgtg
     5581 tgcgccgggg gtcaactgat agccggcagc ggcggagatc acgccacggc ctactccaca
     5641 ttgctgccgc cgccgccacc gccgccatcg gccagcagcg gtaatattgg tggcggaatg
     5701 tacggtcatc agggtgggac gggtactggt ggtggcccgc caccgtgtcc accgccggtg
     5761 ccgccgcatc atgcctatac cgtgcatcat cccgtcagct atgcccaccc acactcgcat
     5821 ccgcacggac atccgcacgg ccatccgcac ggtcacccgc acccgcatcc gcacgagcac
     5881 ttcgactctt acatctccaa gctgcagtcg ctctgcgttc cgcccgatgt ctatgccctg
     5941 cccgatgacg ccgatcggac cgtctacaat tcggtgaagc caagcatgca ccaggactac
     6001 ggcaaactga tgccgacacc catctaaacg aggaggatat caaactaaca gccggtatcc
     6061 agccgatgtt ccatcccgtc cagggttcgt gagtgtgtat atatactacc caaagagtgg
     6121 agaaaacaga ctatatgtaa gaattgtggt gtggggtatt gggtacagat gctttaacct
     6181 gacgaacgag gcatctcccg agcccaagga tctttataca tatagcgcat ggatatctgt
     6241 agagatctac gtatatagcg cgtgctcctg gaaaacggac agatcctttt cctagtgtta
     6301 gattgagctg ttgcacatcc tatatcctag acgctttcgt cgtgttgata gaaactgtat
     6361 aaagtattga aacctaatga aaaaaaaaaa caaaaataat aagtgtgtaa taatattaat
     6421 tcataatacg atttacgatt aacaaatttt ttttttgtct gtatcaaata ctaaaagaaa
     6481 actagaagtt atagaagcat acataaatat agaagtagga gtttaacaac gtacatatat
     6541 gttaattgta gggcatttgt ttggtgttga tgtcttggtc aattttttgc atacaaaatg
     6601 gataatgttc ttaaatgttt aatcaacccc tccacccaca cacacacacg caaaaacccc
     6661 accccacccc agccctaaac cccaaagacc gagttctagt ccctcaaagt aagtttagtt
     6721 tagagaaaaa gtcaaacacc aaaatgtgga gataaaatga tataataaaa aacataaacg
     6781 agaaaatata ttcaatacta aagtatagag gatgtaatcg tgttacaatt tttttttttt
     6841 tttgtaatat tgaatatgaa agggcaaatg tgtgtgtaat atcaa