PREDICTED: Drosophila obscura mucin-5AC (LOC111070658), mRNA.


LOCUS       XM_022361366            1275 bp    mRNA    linear   INV 14-MAY-2021
ACCESSION   XM_022361366
VERSION     XM_022361366.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022361366.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..1275
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..1275
                     /gene="LOC111070658"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 1 Protein, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 6 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111070658"
     CDS             33..1256
                     /gene="LOC111070658"
                     /codon_start=1
                     /product="mucin-5AC"
                     /protein_id="XP_022217058.2"
                     /db_xref="GeneID:111070658"
                     /translation="MALGALLLALNVEAAAARKSFSLGNWRFNDPHYSSAQYAKILAD
                     NGIGHDQDPAEKGASAGAVAAAGADGVERGMGPLQIKYVDYQPHCASGGVPVCATNGT
                     DHFYFENDCRLEAHNMKMLFQYGTELEPTELERCLPTCRTMKCTKVQRPVCALAEIGG
                     EGSGAQAPITFPNECEVRRHECQSKQAMRILHAGPCSPPPVKGRRKKKLRRSKGKRPV
                     SAAGTGTDRPKVYVMLAQPLTRKSTTSTTTTTMPAMPTMPTMPIASSTATPLRFRQLI
                     NSGNPMVSVSRAMDAYSVYNIDDVGYDYGEITDSTLSLFVPGVGRVTDAYPTTTTTTT
                     TPKAETLTPMPMPVITTTTASPTVWTSSTTSTWITTESSEHSSSSTAATTEASDSLSY
                     DPTSDSSAADRAEPL"
     misc_feature    465..620
                     /gene="LOC111070658"
                     /note="Kazal type serine protease inhibitors and
                     follistatin-like domains. Kazal inhibitors inhibit serine
                     proteases, such as, trypsin, chymotrypsin, avian
                     ovomucoids, and elastases. The inhibitory domain has one
                     reactive site peptide bond, which serves the...; Region:
                     KAZAL_FS; cd00104"
                     /db_xref="CDD:238052"
ORIGIN      
        1 cacatcagaa gcgagaagtc gtccagcgaa taatggcctt gggcgccctg ctactggccc
       61 taaacgtcga ggctgctgcg gcgagaaagt ccttttcgct tgggaactgg cgtttcaatg
      121 atccccacta ctccagtgcc cagtatgcca agatactggc ggataatggc attggccacg
      181 accaggaccc cgcggagaag ggtgccagtg caggcgcggt tgcagctgca ggtgcagatg
      241 gagttgagag gggtatgggt cccctgcaga tcaagtacgt cgactaccag ccacactgcg
      301 cgtcgggcgg tgtgcccgtc tgcgccacga atggcacgga tcacttctac ttcgagaacg
      361 actgccgctt ggaggcgcac aacatgaaga tgctgttcca gtacggcaca gagctggagc
      421 ccacggagct ggagcgatgc ctgccaactt gccggaccat gaagtgcacg aaggtccagc
      481 ggcccgtctg tgccctggcc gagatcggag gagaaggcag cggcgctcag gcacccatta
      541 cattccccaa tgagtgtgag gtgcgacggc acgagtgcca gagcaaacaa gctatgcgta
      601 tcctgcatgc cggaccctgc tctccgcccc cagtcaaggg caggcgcaag aagaagttgc
      661 gccgcagcaa gggaaagcgg ccagtatccg cagcaggaac aggtacagat cgtcccaagg
      721 tttatgtgat gctggcccag ccattgacaa ggaaaagcac gacgagtacg acgacgacaa
      781 cgatgccagc gatgccaacg atgccaacga tgccgatcgc cagcagtact gcgactccac
      841 tgcgattccg tcagctgatt aactccggca atccgatggt atccgtgtcg cgtgccatgg
      901 acgcctacag tgtctacaat atagacgatg tgggctacga ctatggcgag atcaccgact
      961 cgacgctctc gctctttgtg cccggcgtgg gccgggtaac cgatgcatat cccaccacca
     1021 caacgaccac cacaacaccg aaggcagaaa cgttgacgcc catgcccatg ccagtcatta
     1081 ccacgacgac ggcttcccca accgtgtgga ccagcagcac cacctccaca tggatcacca
     1141 ccgaaagctc ggagcacagc agcagcagca cagcagcaac cacagaggct tccgatagcc
     1201 tcagctatga cccaaccagc gattcatctg cagcggatag agcagagcca ctttaaggga
     1261 taaagaacat ttata