PREDICTED: Drosophila obscura mucin-5AC (LOC111072436), transcript


LOCUS       XM_022364310            4086 bp    mRNA    linear   INV 14-MAY-2021
            variant X2, mRNA.
ACCESSION   XM_022364310
VERSION     XM_022364310.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022364310.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..4086
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..4086
                     /gene="LOC111072436"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 3 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 12 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111072436"
     CDS             101..3118
                     /gene="LOC111072436"
                     /codon_start=1
                     /product="uncharacterized protein LOC111072436 isoform X2"
                     /protein_id="XP_022220002.2"
                     /db_xref="GeneID:111072436"
                     /translation="MSSPDEPGPSNGRKSRSKRRDKSVSRSSNSSSGSNFGRHSSNVV
                     NGGSLRDRLLVANAMATDETNSMVNGNDKNQRKKKKKKSSRRKSQTGLKGYSGRNPSL
                     SYLQNEISDDSDEDTRDEVMIPVTDSSQLSRKRPKSRMGIKTNDNNVENKAKVSAASI
                     PPSKKKKKNQTPCVFIPRKLICGDDPLPDPLPEVAPRRKSIYSDAAKKPKPNLSDELY
                     RLPFKFGWKREVVTPSPLSNTSNHTIYTSPCGKRCRQISEIVPLLTNELTIEHFIFGT
                     HLLGAGSEFETSRQALSREMHYAALKERRKSLAADKSTASATIKVERKRRQTMGAESY
                     PKEASASAPFGKRRKSINPAESVTEPSKPMAVESTKPLAGEVAALVTGKRVPKPKVPK
                     GASPPTEGWTSTMAVKGNARLLAAASNGNARTAGSSNASGSSNAAPVSHAKRATCGSC
                     LKLIKGSVCQSCVRSSAREEGPNAGRIMDEYEELEEDEEESEESYQAGTVSNGLKVTK
                     MIEPPGEMPPAELFSTDKSPVTTPTDLYMPQEVVVIGGRKAISIVGEPTTTSQPKVIV
                     PNPPDLSSYEEFYGKRIAAPKQLASPTSLWGAALGEGFNCHFLLSLMKTLNQQDRVNC
                     SNVCKLWNLVSRDSDVWKSVSLRDTKVNNWPALVREMARNCTRELDMMGAIIPNTGTL
                     IAGDMRVLTDMRTVRTNHTKADFLHQIFSGLPQLEKLIGTCVSSGLIMTDIDKMENLN
                     ELRIRMTDTKASITGLPHVGKLTHLRVLSLRGVKNLGNLLFLKELPNLETLNLGYCQS
                     MHRLQLGNEVLPTLTKLQRFRLETDPRKKTSFPIDEIMKGLAHAGGVRRLELVNVDVD
                     CKFSQLLSNCNTVEELLLIPKCQTNTAVMIRSVMGISRNGSQLKQFKLVLITQLLTAT
                     GAMLRNPDVPMVPVIRPIPGILLGDRLNSCSKECQEQQHDRCVAGLPFERLKIIMSEL
                     MPNSSPSVVTMAMMDTPTIQLGRLPPDATPPNF"
     misc_feature    752..943
                     /gene="LOC111072436"
                     /note="MeCP2, MBD1, MBD2, MBD3, MBD4, CLLD8-like, and
                     BAZ2A-like proteins constitute a family of proteins that
                     share the methyl-CpG-binding domain (MBD). The MBD
                     consists of about 70 residues and is defined as the
                     minimal region required for binding to...; Region: MBD;
                     cl00110"
                     /db_xref="CDD:469618"
     misc_feature    order(785..787,791..793,797..799,818..820,824..826,
                     851..853,860..862,872..874)
                     /gene="LOC111072436"
                     /note="DNA binding site [nucleotide binding]"
                     /db_xref="CDD:238069"
     misc_feature    <1946..2035
                     /gene="LOC111072436"
                     /note="Region: F-box-like; pfam12937"
                     /db_xref="CDD:463757"
     misc_feature    <2228..>2491
                     /gene="LOC111072436"
                     /note="Leucine-rich repeat (LRR) protein [Transcription];
                     Region: LRR; COG4886"
                     /db_xref="CDD:443914"
ORIGIN      
        1 tactgtgtac ggtgtgccgt gactttgtcc gccgcagaaa gtggttaatt ttggttaaaa
       61 tagctcaagt gttggctcaa ttttgtgtaa ttcatcagat atgagctctc ccgatgaacc
      121 tggcccttca aatggacgta agtcccgatc gaagcggcgg gataagtccg tgtcccgaag
      181 cagtaattcc agtagtgggt caaactttgg tcgacatagt agtaacgtcg tcaacggggg
      241 aagcttgaga gaccgattgc tggtggctaa cgccatggcc actgatgaaa caaacagcat
      301 ggtaaatgga aacgataaaa accagagaaa gaagaagaag aagaagtcaa gtcgacgcaa
      361 gtcacagaca ggattgaagg gatattccgg aagaaatcct tccctctcgt atttacagaa
      421 cgaaatctcc gatgactccg atgaagatac gcgggatgag gtgatgattc ctgtcactga
      481 ttccagccaa ttgtcccgaa aacgcccaaa gtcgagaatg ggaattaaga caaacgacaa
      541 caacgtggaa aacaaggcga aggtgtcagc tgcgtcgatt cctccttcaa agaaaaagaa
      601 gaagaatcag actccttgtg ttttcatacc cagaaaatta atttgtggtg atgatccgtt
      661 gcccgatcca ttgccagagg tggcccctcg acgcaaaagt atttactcgg atgcggccaa
      721 gaagccgaag ccaaatttgt ccgacgagct ctatcgtctg ccgtttaaat ttggctggaa
      781 gcgtgaggtg gtgactccca gcccactgtc caacacttcg aatcacacaa tctacacatc
      841 gccctgcggc aagaggtgcc gacaaatcag tgagattgta ccattgctga cgaatgaact
      901 caccatcgag cactttatct ttgggacgca tctcctgggt gccggatccg agttcgagac
      961 gagccgtcag gccttgagca gggagatgca ctatgccgct ttaaaggagc gccgcaaatc
     1021 gctggcggcc gacaaatcga cagcgtcggc cacaattaag gtggagcgca aacgtcgtca
     1081 aacgatggga gccgaatcct atccgaagga ggcatctgcc tctgcgccat ttggcaaacg
     1141 tcgcaaatcc atcaatccag cggaatcggt caccgaaccc agtaagccga tggcagtcga
     1201 atccacgaaa cctctggcag gcgaagtggc ggctcttgta acaggcaaac gcgtacccaa
     1261 gccgaaggtg ccaaagggcg ccagccctcc cactgagggt tggacctcca ccatggccgt
     1321 caagggaaat gcgcgtctcc tggctgccgc cagcaatggc aacgccagaa ctgctggatc
     1381 ttcgaatgca agcggcagct caaatgccgc cccggtgagc catgccaagc gcgccacctg
     1441 tggatcctgc ctaaagctaa tcaagggtag cgtttgccag agctgcgtgc ggtcgtcggc
     1501 gagggaggag ggaccaaatg ctggccgcat aatggatgaa tatgaagaac tggaggagga
     1561 cgaggaggaa agcgaggaga gctaccaggc gggcactgtg agcaatgggc taaaagtcac
     1621 aaaaatgatc gagccgcccg gcgagatgcc accagcggag ctattcagca cagacaaatc
     1681 cccagtgaca acgccaactg atttatacat gccccaggag gttgtggtca tcggtgggcg
     1741 taaggcgatt tccatcgttg gagaaccaac gaccacaagt caaccaaaag ttattgtgcc
     1801 aaatccacca gacttgagca gctacgaaga attctacggc aaacgcattg ctgcacccaa
     1861 gcaattggct tcacccacta gcctgtgggg agcagcgctc ggagaaggct tcaattgtca
     1921 ttttttgctc agcctcatga agacactcaa tcagcaggat cgtgtcaatt gctcgaatgt
     1981 gtgcaagttg tggaacttgg tctcgcgtga ttctgatgta tggaaatcag tatctctgcg
     2041 cgatacaaag gtcaacaatt ggccagcttt ggtgcgcgag atggcacgca actgcacacg
     2101 tgaactggac atgatgggtg cgattatacc caatactggg accctcatcg ccggtgacat
     2161 gcgtgtgcta acagatatgc gcacggtgcg taccaatcat acgaaagccg actttctgca
     2221 ccagatattc agtggcttgc cccaacttga gaagctgatc ggcacatgcg tcagctcggg
     2281 cctcatcatg accgacattg ataagatgga gaacctgaac gagctgcgca ttcgaatgac
     2341 cgataccaag gcatcgatca ccggtctgcc ccacgtgggc aagctgacgc atctgcgtgt
     2401 cctgagtctg cgcggcgtca agaatttggg taacttgctg tttctaaagg agttgcccaa
     2461 tctggagact ctgaacctgg gctactgcca gagcatgcac cgtctacaac tgggcaacga
     2521 ggtgctgccg acactcacaa aattgcagag attccgctta gaaacagacc cgcgtaagaa
     2581 gacctcgttc ccaatcgacg agatcatgaa gggactcgcc catgctggtg gcgtgcgtcg
     2641 cctggagctg gtcaacgtgg atgtggactg taaatttagc caattgctgt ccaactgcaa
     2701 tacggtggag gagctgctgc tgatacccaa atgtcagacc aacacggccg tcatgatccg
     2761 ctccgtaatg ggaatcagtc gtaatggatc tcagttaaag caatttaagc ttgtgcttat
     2821 cacccagctg cttaccgcaa cgggcgccat gttgcgcaac cccgatgtgc ccatggtacc
     2881 cgtaatccgt cctatacccg gtattctgct cggcgatcgc ttgaacagct gctccaagga
     2941 atgtcaagag cagcagcatg acaggtgtgt ggctggattg ccctttgagc gcctaaagat
     3001 cataatgtcg gagttgatgc cgaattcctc accgtcggtg gtcaccatgg ccatgatgga
     3061 cacacccaca atccaacttg ggcgtctgcc acccgatgct acgcccccaa acttttgaaa
     3121 cacacaaaaa cccacactac ccctacccct acccccacca accaaaccaa ctgaatgcac
     3181 ctgtaaaaga gaaagtcaag actgagtctt cgagagcgat cacaaaaatt ttaattcacg
     3241 gactaacaca aattaaaaca ctaggacaag aagaagaaga agtattacgg tcggctctat
     3301 tttatgtttt cgtatttcat gtgacgtagc tgcaaagtgg ctatcaatgg aaattatcta
     3361 ttaattatct aatattaatt tgacttatgc attatcctaa ctactgttaa ctacatttaa
     3421 cttaggcgcg ttttaaacgc tgcaccaacg tgaagagtca actgatgacc acacaacaaa
     3481 acacacaaca cacaccgaag aaagaaagaa ggaaagatct gaactcgtat tcgtttagtt
     3541 tctaattatc tgaatgtgta gattcatatg tataagtatt acatactgtt tcaatgtaat
     3601 gcatcgactt aatgtgtata tagtactcgt actcgtacta acaatacaac tacactaaga
     3661 gagttgtttg cccaaagcca gccaactgaa tagatattat ttttgttttt tttttttttt
     3721 catttaaaca aaaatcatta tcaatattag cgcatcaata ggtagctctt gagagcatct
     3781 tgaattgatg gcgaattata tttaagttca ctgaactgaa agataatcaa aaaaagggct
     3841 tgggcattcc aaaggaaacc taagccaaac tgtggaagag ttgtttagtt tcactaggcc
     3901 cgaggcaaac aataaactat tctcgtgtat agctattgat tttgtagtgt aaatattatc
     3961 aaggcaagca ttttcacagc ccacagtccc actctggaaa atgagtttgt tttgtgtact
     4021 gtggaggact gactggggct ggcctttgtg tatattacta ttaaaatctg tgtgactttc
     4081 tccaaa