PREDICTED: Drosophila obscura mucin-5AC (LOC111072436), transcript


LOCUS       XM_022364309            4668 bp    mRNA    linear   INV 14-MAY-2021
            variant X1, mRNA.
ACCESSION   XM_022364309
VERSION     XM_022364309.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022364309.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..4668
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..4668
                     /gene="LOC111072436"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 3 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 16 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111072436"
     CDS             101..3700
                     /gene="LOC111072436"
                     /codon_start=1
                     /product="mucin-5AC isoform X1"
                     /protein_id="XP_022220001.2"
                     /db_xref="GeneID:111072436"
                     /translation="MSSPDEPGPSNGRKSRSKRRDKSVSRSSNSSSGSNFGRHSSNVV
                     NGGSLRDRLLVANAMATDETNSMVNGNDKNQRKKKKKKSSRRKSQTGLKGYSGRNPSL
                     SYLQNEISDDSDEDTRSPAEIRALCTSGLRVFPREQQTESTADSAVQAAAAAATTPDA
                     PADPASPDTDTPTSSQMSSSPSPFSRTEQTKTTIQLPTATEPSHPSIQLTTTTTTPNT
                     GISTSTIPATSSCTNLMTPVSSASPVTTLQSPTTPPSPTFSPTASANNNNSNHSSENI
                     SNHSSVASITSEPEPESRTTTTATASQQTATDLDKKDEVMIPVTDSSQLSRKRPKSRM
                     GIKTNDNNVENKAKVSAASIPPSKKKKKNQTPCVFIPRKLICGDDPLPDPLPEVAPRR
                     KSIYSDAAKKPKPNLSDELYRLPFKFGWKREVVTPSPLSNTSNHTIYTSPCGKRCRQI
                     SEIVPLLTNELTIEHFIFGTHLLGAGSEFETSRQALSREMHYAALKERRKSLAADKST
                     ASATIKVERKRRQTMGAESYPKEASASAPFGKRRKSINPAESVTEPSKPMAVESTKPL
                     AGEVAALVTGKRVPKPKVPKGASPPTEGWTSTMAVKGNARLLAAASNGNARTAGSSNA
                     SGSSNAAPVSHAKRATCGSCLKLIKGSVCQSCVRSSAREEGPNAGRIMDEYEELEEDE
                     EESEESYQAGTVSNGLKVTKMIEPPGEMPPAELFSTDKSPVTTPTDLYMPQEVVVIGG
                     RKAISIVGEPTTTSQPKVIVPNPPDLSSYEEFYGKRIAAPKQLASPTSLWGAALGEGF
                     NCHFLLSLMKTLNQQDRVNCSNVCKLWNLVSRDSDVWKSVSLRDTKVNNWPALVREMA
                     RNCTRELDMMGAIIPNTGTLIAGDMRVLTDMRTVRTNHTKADFLHQIFSGLPQLEKLI
                     GTCVSSGLIMTDIDKMENLNELRIRMTDTKASITGLPHVGKLTHLRVLSLRGVKNLGN
                     LLFLKELPNLETLNLGYCQSMHRLQLGNEVLPTLTKLQRFRLETDPRKKTSFPIDEIM
                     KGLAHAGGVRRLELVNVDVDCKFSQLLSNCNTVEELLLIPKCQTNTAVMIRSVMGISR
                     NGSQLKQFKLVLITQLLTATGAMLRNPDVPMVPVIRPIPGILLGDRLNSCSKECQEQQ
                     HDRCVAGLPFERLKIIMSELMPNSSPSVVTMAMMDTPTIQLGRLPPDATPPNF"
     misc_feature    1334..1525
                     /gene="LOC111072436"
                     /note="MeCP2, MBD1, MBD2, MBD3, MBD4, CLLD8-like, and
                     BAZ2A-like proteins constitute a family of proteins that
                     share the methyl-CpG-binding domain (MBD). The MBD
                     consists of about 70 residues and is defined as the
                     minimal region required for binding to...; Region: MBD;
                     cl00110"
                     /db_xref="CDD:469618"
     misc_feature    order(1367..1369,1373..1375,1379..1381,1400..1402,
                     1406..1408,1433..1435,1442..1444,1454..1456)
                     /gene="LOC111072436"
                     /note="DNA binding site [nucleotide binding]"
                     /db_xref="CDD:238069"
     misc_feature    <2528..2617
                     /gene="LOC111072436"
                     /note="Region: F-box-like; pfam12937"
                     /db_xref="CDD:463757"
     misc_feature    <2810..>3073
                     /gene="LOC111072436"
                     /note="Leucine-rich repeat (LRR) protein [Transcription];
                     Region: LRR; COG4886"
                     /db_xref="CDD:443914"
ORIGIN      
        1 tactgtgtac ggtgtgccgt gactttgtcc gccgcagaaa gtggttaatt ttggttaaaa
       61 tagctcaagt gttggctcaa ttttgtgtaa ttcatcagat atgagctctc ccgatgaacc
      121 tggcccttca aatggacgta agtcccgatc gaagcggcgg gataagtccg tgtcccgaag
      181 cagtaattcc agtagtgggt caaactttgg tcgacatagt agtaacgtcg tcaacggggg
      241 aagcttgaga gaccgattgc tggtggctaa cgccatggcc actgatgaaa caaacagcat
      301 ggtaaatgga aacgataaaa accagagaaa gaagaagaag aagaagtcaa gtcgacgcaa
      361 gtcacagaca ggattgaagg gatattccgg aagaaatcct tccctctcgt atttacagaa
      421 cgaaatctcc gatgactccg atgaagatac gcggtcgcca gctgaaatca gggcgctttg
      481 cacgagtggt ctgagggtat tcccccgtga acaacagaca gaatcaacgg cagactcagc
      541 agtacaggcc gctgctgctg ctgctactac tcctgatgct ccggctgatc cggctagccc
      601 ggacacggac actccgactt cttcacagat gtcatcatca ccatcaccat tctcccgcac
      661 ggagcagacg aagacaacta tccaactccc gaccgcaaca gaaccatccc atccttccat
      721 ccaactaaca acaacaacta ccactccgaa cactggaatt tcaactagca ccatcccagc
      781 aacgtcctcc tgtactaatt taatgactcc agtatcgtcc gcatcaccag taacaaccct
      841 tcagtctccg acaactcctc ccagcccaac attttcaccg acggcatcag ccaacaacaa
      901 caacagtaac cactcttcag agaacatctc aaaccactct tctgtggctt caatcacaag
      961 cgaaccagaa ccagaatcgc gaacaacaac tacagcaact gcaagtcagc aaacagcaac
     1021 agatttagac aagaaggatg aggtgatgat tcctgtcact gattccagcc aattgtcccg
     1081 aaaacgccca aagtcgagaa tgggaattaa gacaaacgac aacaacgtgg aaaacaaggc
     1141 gaaggtgtca gctgcgtcga ttcctccttc aaagaaaaag aagaagaatc agactccttg
     1201 tgttttcata cccagaaaat taatttgtgg tgatgatccg ttgcccgatc cattgccaga
     1261 ggtggcccct cgacgcaaaa gtatttactc ggatgcggcc aagaagccga agccaaattt
     1321 gtccgacgag ctctatcgtc tgccgtttaa atttggctgg aagcgtgagg tggtgactcc
     1381 cagcccactg tccaacactt cgaatcacac aatctacaca tcgccctgcg gcaagaggtg
     1441 ccgacaaatc agtgagattg taccattgct gacgaatgaa ctcaccatcg agcactttat
     1501 ctttgggacg catctcctgg gtgccggatc cgagttcgag acgagccgtc aggccttgag
     1561 cagggagatg cactatgccg ctttaaagga gcgccgcaaa tcgctggcgg ccgacaaatc
     1621 gacagcgtcg gccacaatta aggtggagcg caaacgtcgt caaacgatgg gagccgaatc
     1681 ctatccgaag gaggcatctg cctctgcgcc atttggcaaa cgtcgcaaat ccatcaatcc
     1741 agcggaatcg gtcaccgaac ccagtaagcc gatggcagtc gaatccacga aacctctggc
     1801 aggcgaagtg gcggctcttg taacaggcaa acgcgtaccc aagccgaagg tgccaaaggg
     1861 cgccagccct cccactgagg gttggacctc caccatggcc gtcaagggaa atgcgcgtct
     1921 cctggctgcc gccagcaatg gcaacgccag aactgctgga tcttcgaatg caagcggcag
     1981 ctcaaatgcc gccccggtga gccatgccaa gcgcgccacc tgtggatcct gcctaaagct
     2041 aatcaagggt agcgtttgcc agagctgcgt gcggtcgtcg gcgagggagg agggaccaaa
     2101 tgctggccgc ataatggatg aatatgaaga actggaggag gacgaggagg aaagcgagga
     2161 gagctaccag gcgggcactg tgagcaatgg gctaaaagtc acaaaaatga tcgagccgcc
     2221 cggcgagatg ccaccagcgg agctattcag cacagacaaa tccccagtga caacgccaac
     2281 tgatttatac atgccccagg aggttgtggt catcggtggg cgtaaggcga tttccatcgt
     2341 tggagaacca acgaccacaa gtcaaccaaa agttattgtg ccaaatccac cagacttgag
     2401 cagctacgaa gaattctacg gcaaacgcat tgctgcaccc aagcaattgg cttcacccac
     2461 tagcctgtgg ggagcagcgc tcggagaagg cttcaattgt cattttttgc tcagcctcat
     2521 gaagacactc aatcagcagg atcgtgtcaa ttgctcgaat gtgtgcaagt tgtggaactt
     2581 ggtctcgcgt gattctgatg tatggaaatc agtatctctg cgcgatacaa aggtcaacaa
     2641 ttggccagct ttggtgcgcg agatggcacg caactgcaca cgtgaactgg acatgatggg
     2701 tgcgattata cccaatactg ggaccctcat cgccggtgac atgcgtgtgc taacagatat
     2761 gcgcacggtg cgtaccaatc atacgaaagc cgactttctg caccagatat tcagtggctt
     2821 gccccaactt gagaagctga tcggcacatg cgtcagctcg ggcctcatca tgaccgacat
     2881 tgataagatg gagaacctga acgagctgcg cattcgaatg accgatacca aggcatcgat
     2941 caccggtctg ccccacgtgg gcaagctgac gcatctgcgt gtcctgagtc tgcgcggcgt
     3001 caagaatttg ggtaacttgc tgtttctaaa ggagttgccc aatctggaga ctctgaacct
     3061 gggctactgc cagagcatgc accgtctaca actgggcaac gaggtgctgc cgacactcac
     3121 aaaattgcag agattccgct tagaaacaga cccgcgtaag aagacctcgt tcccaatcga
     3181 cgagatcatg aagggactcg cccatgctgg tggcgtgcgt cgcctggagc tggtcaacgt
     3241 ggatgtggac tgtaaattta gccaattgct gtccaactgc aatacggtgg aggagctgct
     3301 gctgataccc aaatgtcaga ccaacacggc cgtcatgatc cgctccgtaa tgggaatcag
     3361 tcgtaatgga tctcagttaa agcaatttaa gcttgtgctt atcacccagc tgcttaccgc
     3421 aacgggcgcc atgttgcgca accccgatgt gcccatggta cccgtaatcc gtcctatacc
     3481 cggtattctg ctcggcgatc gcttgaacag ctgctccaag gaatgtcaag agcagcagca
     3541 tgacaggtgt gtggctggat tgccctttga gcgcctaaag atcataatgt cggagttgat
     3601 gccgaattcc tcaccgtcgg tggtcaccat ggccatgatg gacacaccca caatccaact
     3661 tgggcgtctg ccacccgatg ctacgccccc aaacttttga aacacacaaa aacccacact
     3721 acccctaccc ctacccccac caaccaaacc aactgaatgc acctgtaaaa gagaaagtca
     3781 agactgagtc ttcgagagcg atcacaaaaa ttttaattca cggactaaca caaattaaaa
     3841 cactaggaca agaagaagaa gaagtattac ggtcggctct attttatgtt ttcgtatttc
     3901 atgtgacgta gctgcaaagt ggctatcaat ggaaattatc tattaattat ctaatattaa
     3961 tttgacttat gcattatcct aactactgtt aactacattt aacttaggcg cgttttaaac
     4021 gctgcaccaa cgtgaagagt caactgatga ccacacaaca aaacacacaa cacacaccga
     4081 agaaagaaag aaggaaagat ctgaactcgt attcgtttag tttctaatta tctgaatgtg
     4141 tagattcata tgtataagta ttacatactg tttcaatgta atgcatcgac ttaatgtgta
     4201 tatagtactc gtactcgtac taacaataca actacactaa gagagttgtt tgcccaaagc
     4261 cagccaactg aatagatatt atttttgttt tttttttttt ttcatttaaa caaaaatcat
     4321 tatcaatatt agcgcatcaa taggtagctc ttgagagcat cttgaattga tggcgaatta
     4381 tatttaagtt cactgaactg aaagataatc aaaaaaaggg cttgggcatt ccaaaggaaa
     4441 cctaagccaa actgtggaag agttgtttag tttcactagg cccgaggcaa acaataaact
     4501 attctcgtgt atagctattg attttgtagt gtaaatatta tcaaggcaag cattttcaca
     4561 gcccacagtc ccactctgga aaatgagttt gttttgtgta ctgtggagga ctgactgggg
     4621 ctggcctttg tgtatattac tattaaaatc tgtgtgactt tctccaaa