PREDICTED: Drosophila obscura mucin-19 (LOC111070677), mRNA.


LOCUS       XM_022361393            2323 bp    mRNA    linear   INV 14-MAY-2021
ACCESSION   XM_022361393
VERSION     XM_022361393.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022361393.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..2323
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..2323
                     /gene="LOC111070677"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 5 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 17 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111070677"
     CDS             396..1847
                     /gene="LOC111070677"
                     /codon_start=1
                     /product="mucin-19"
                     /protein_id="XP_022217085.2"
                     /db_xref="GeneID:111070677"
                     /translation="MNAKKRQRLDLGLDIDATTGGGAGAPKATAAPTTTTTTTTTATT
                     ASDLSDALLASSFGNGQSLFLTSTGNGSGGAQILLTICGDENSDESQEYYAIKQEPDM
                     DLNSLLPSNLQLPTGCEIYLVKDTTISSPMQLNGHTHTHTQTQTTHIQAQTIPPKATI
                     KLEPDSMSDRCGLTVNKLCTSSTNILYVSNGASDGKPSTNATATPERASGTPKPAVAA
                     TIAKVAAAAAAAPTTAATTTNTMRALKLIEEHVGGGGGGGGAGGAGSTASAVGTTMSG
                     TATSKLDAYKKRDDKRRATHNEVERRRRDKINCWIFKLKEMLPIEGSRYRPPPPSNGQ
                     MEPVSISLSSSTSEASTSPGLRVNQSANGRTPPNDSKSQILIKACEYIKSMQGEIDNL
                     REGLREADKLRVTNKTLRDELNSLKRQQELQERFHSNGGGSFNVTLNSLNSSATSDLF
                     DGIDGPHHGMGMSMGMGMGAFGKRGLMIADYDE"
     misc_feature    1257..1553
                     /gene="LOC111070677"
                     /note="basic Helix Loop Helix (bHLH) domain superfamily;
                     Region: bHLH_SF; cl00081"
                     /db_xref="CDD:469605"
     misc_feature    order(1293..1298,1302..1304,1317..1319,1503..1508)
                     /gene="LOC111070677"
                     /note="DNA binding site [nucleotide binding]"
                     /db_xref="CDD:381494"
     misc_feature    order(1311..1316,1323..1328,1332..1337,1347..1349,
                     1506..1511,1518..1523,1530..1532,1536..1541,1548..1553)
                     /gene="LOC111070677"
                     /note="dimer interface [polypeptide binding]; other site"
                     /db_xref="CDD:381494"
ORIGIN      
        1 atatcaatta acgtaatgaa gcccaaacaa tcgttgttgt taacaattcg tgttgttaaa
       61 tggcaacgca aatgcgtcaa aagtcgccgt tgagccctct aatcgcgaag aacctggtgg
      121 ccaaacatca ccgcggcagt taatatccaa aatcaaggcg ggcatacagc aacaagcatt
      181 gctgcattcg cagcgcagaa gagtgccagg ccaagtgcca gcgcgactcg ggcctgggga
      241 gccacaaact ccaattggac cgatcccatt cgatccgatt cccaacccga ttagagttac
      301 gtgagctggg cgctggagaa agtatacgaa aaccgagtaa caaaagcaga tttcgttgcc
      361 tgccagatga caacagtcga acgtccgttg acgctatgaa cgccaagaaa cgtcaacgcc
      421 tggacctggg gctggacatt gatgccacaa caggaggagg agcaggtgca ccaaaagcaa
      481 ctgccgctcc aacgaccaca acaacaacaa caacaacagc aacgactgca agtgacttat
      541 ccgatgcttt gttggccagt tcgtttggca acggccagag cctgttcctg accagcaccg
      601 gcaatggcag tggcggtgcc cagatcctat tgaccatctg cggtgacgag aactcggatg
      661 agtcgcagga gtattatgcc atcaagcagg agcccgatat ggatttgaac tcgctgctgc
      721 caagcaacct acagctgccc actggctgtg agatatatct ggtgaaggac accaccatca
      781 gttcgcccat gcagctcaat ggacataccc atacccatac acagacccag acgacccaca
      841 ttcaagccca gaccattcca ccaaaggcaa ccatcaaact ggagccggat tcgatgagcg
      901 accgctgtgg tctcactgta aataagctct gcacatcgtc cacgaacatc ctctacgtga
      961 gtaatggcgc cagtgacggg aagccctcca caaatgcgac tgcaacgcca gagagagcat
     1021 caggcacacc aaaaccagct gtggcggcaa cgatagccaa agtggccgcc gccgccgccg
     1081 ccgcacccac aacagccgcc acaactacaa acacaatgcg tgctctaaaa ctaatcgagg
     1141 agcatgtggg tggaggagga ggaggaggtg gagcaggggg tgctggtagc acggccagtg
     1201 cggttggtac aacgatgtct ggcactgcca cctccaaatt ggatgcgtac aagaagcggg
     1261 acgacaagcg tcgtgccacg cacaatgagg tggagcgtag acgtcgcgac aaaatcaatt
     1321 gctggatctt caagctgaag gagatgctgc ccatcgaggg cagccgctac cggccaccgc
     1381 caccaagcaa tgggcaaatg gagccggtga gcataagcct cagttcgagc accagcgagg
     1441 ccagcaccag tcccggcctg agagtcaacc agagcgccaa tggacggacg ccgcccaacg
     1501 actccaagtc gcagatattg atcaaggcct gtgagtacat caagagcatg cagggcgaga
     1561 tagacaactt acgcgagggc ctgcgtgagg cggacaagct gcgtgtgacc aataagacgc
     1621 tgcgggatga gctgaacagc ttgaagcgac agcaggagct gcaggagcgc ttccacagca
     1681 acggcggtgg atcgtttaat gtgacactga attcgttgaa tagctcggct accagtgacc
     1741 tgttcgatgg catagatggg ccacaccatg gcatgggcat gagcatgggc atgggcatgg
     1801 gggcctttgg caagcgcggt ctcatgatag ccgattacga tgaatagaat atatacggta
     1861 taggaggggt tttggcgcta gcgctggcgc tgggtcgtcc cccgccgaac caccatacac
     1921 cgccccagcc tcaaacatcc tccaaagaat gacgtaccac acgtaccacg tacaataaaa
     1981 acaaattgga aagacaagtg atttttcttg ttatcgctgt taaataatta aatatatata
     2041 tatatatagg aaaaaaaact acatatatta taaattaatg tataattagt tttttttatt
     2101 gattgttttg tttgaagcac acggatcctc attttacaat tgtttgccat gtcaactttt
     2161 agtgctgttt gccataaacc taaactaacc tcggcatccc ccttccatat agtaactata
     2221 atattaatga aaccgttact taagcatcac aatttatgcc attttttcca catttacaag
     2281 aaacattatt atatacctgt ccctccccct aaaaaaatat atg