PREDICTED: Drosophila obscura homeotic protein female sterile


LOCUS       XM_041591943            3755 bp    mRNA    linear   INV 14-MAY-2021
DEFINITION  PREDICTED: Drosophila obscura homeotic protein female sterile
            (LOC111072429), transcript variant X3, mRNA.
ACCESSION   XM_041591943
VERSION     XM_041591943.1
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..3755
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..3755
                     /gene="LOC111072429"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 8 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 17 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111072429"
     CDS             170..3508
                     /gene="LOC111072429"
                     /codon_start=1
                     /product="homeotic protein female sterile isoform X3"
                     /protein_id="XP_041447877.1"
                     /db_xref="GeneID:111072429"
                     /translation="MSSNEPPPRYEPPVEPVNGIVQPAVVPPVDRPGRNTNQLQFLIK
                     TVMKMIWKHHFAWPFQQPVDAKKLNLPDYHKIIKQPMDMGTIKKRLENNYYWSAKETI
                     HDFNTMFNNCYVYNKPGEDVVVMAQTLEKVFLQKIETMPKEELELEPATAKGGKKKAR
                     APATPKSGSGGGGGTGSSTGAAVANSNTGSSNSGSINKVAPSAQQLPIMGSGLAAQST
                     GAGGHGSATGSGTTSRPVSAMGGTVSSTAGGGGAPSIPPISTMPPHTVPGSTNTTTTA
                     TTMVDAIIASLRNPSQAAYPGATQAAANSSSLLDGSSSAAASAAATTAAATAAAAAAA
                     AAAAAAAAASSSGGGAGAPGTVSTAGGVTIPSVNTTTNVHSSYVNSTAGVGVGVDAVI
                     PPQQPAKMKKGVKRKADTTTPTANAFESPYAQMDSKSAKIATRRESNRQVKGKKDLTF
                     QGSGYAMSPSMGVVPGLAAGVAASVAAAKSKEKLSDALKSCNEILKELFSKKHSGYAW
                     PFYKPVDAEMLGLHDYHDIIKKPMDLGTVKRKMDNREYKSAPEFAADVRLIFTNCYKY
                     NPPDHDVVAMGRKLQDVFEMRYANIPDEPVSNAAHHHAHTHGHGHGHGHGQSHGHGHG
                     HGHGGYSSASLKHDGSDSSSEDSSGTENESNSDEERSAKLKMLESKLLGLQEEIRKLS
                     EEASAKKKAKKKLKEKKKSIGGGSGSGSASHHAHASAGGGAGGPSASHGGVSVPASVV
                     ALSAGGAAGPNLSALLSGSLVGASGAGGGVPNVSALHSLAHDMTLAMNQLTGNAAATG
                     AGFTAGIPPPGPAPGGKGANMASAMAAAGAGPGASGGTGGSSKSKSKGQRGKGSSSNA
                     GAGGASSGVTVNAGSGIGGAGAASSAGSGGGSGTTGPSGNSSKRGKGSSSAGGGGGGS
                     SGSAANTTSATGAGARGSSKKKPSQVMNFDSEEEDTAKPMSYDEKRQLSLDINKLPGD
                     KLGRVVHIIQNREPSLRDSNPDEIEIDFETLKPSTLRELESYVASCLRKKTRKPCYKK
                     PSGKSKDEQMAEKKQELEKRLQDVTGQLGASKKNAKKDDSTSNKVEAVQPANPVSSSS
                     SSSDSSSSSSSDSSSSDSSDSEAG"
     misc_feature    269..589
                     /gene="LOC111072429"
                     /note="Bromodomain, Brdt_like subfamily, repeat I. Human
                     Brdt is a testis-specific member of the BET subfamily of
                     bromodomain proteins; the first bromodomain in Brdt has
                     been shown to be essential for male germ cell
                     differentiation. Bromodomains are 110 amino...; Region:
                     Bromo_Brdt_I_like; cd05497"
                     /db_xref="CDD:99929"
     misc_feature    order(356..358,377..379,386..388,503..505,515..517,
                     533..535)
                     /gene="LOC111072429"
                     /note="acetyllysine binding site [active]"
                     /db_xref="CDD:99929"
     misc_feature    1631..1933
                     /gene="LOC111072429"
                     /note="Bromodomain, Brdt_like subfamily, repeat II. Human
                     Brdt is a testis-specific member of the BET subfamily of
                     bromodomain proteins; the first bromodomain in Brdt has
                     been shown to be essential for male germ cell
                     differentiation. Bromodomains are 110 amino...; Region:
                     Bromo_Brdt_II_like; cd05498"
                     /db_xref="CDD:99930"
     misc_feature    order(1709..1711,1730..1732,1739..1741,1856..1858,
                     1868..1870,1886..1888)
                     /gene="LOC111072429"
                     /note="acetyllysine binding site [active]"
                     /db_xref="CDD:99930"
     misc_feature    3026..3220
                     /gene="LOC111072429"
                     /note="Bromodomain extra-terminal - transcription
                     regulation; Region: BET; pfam17035"
                     /db_xref="CDD:435704"
ORIGIN      
        1 agcagcagca gcagtacaac cagcatccac ttgaggatca gataccttaa aagcaaccgc
       61 aacaggagca gggacaaaag caacaaccag aagcctcatc atcagccaac aggaggagca
      121 gcagtagccg cagcaccact gtgtcaccat catcaccatc atcaacaaca tgtcgtccaa
      181 cgaaccacca cctcgctacg agccgcctgt ggagccggtc aatggcattg tgcagccagc
      241 ggttgtgcct ccagttgatc gacccggccg caatacaaat caattgcaat tcttgatcaa
      301 aaccgtaatg aagatgatat ggaaacacca ttttgcgtgg cccttccagc agcccgtcga
      361 cgcgaaaaag ctcaacctgc ccgactacca caagatcatc aagcagccga tggacatggg
      421 aacgatcaag aagcgactgg agaacaacta ttactggtcg gcgaaggaga ccatccatga
      481 cttcaatacc atgttcaaca actgctatgt ctacaacaag cccggcgagg atgtggtcgt
      541 gatggcccag acgctggaga aggtattctt gcagaagatc gagacgatgc ccaaggagga
      601 gcttgaactg gagccggcca cggccaaggg tggcaagaag aaggcacgtg ccccggccac
      661 gcccaagtct ggatcaggag gcggaggtgg aacgggatca agcacgggtg cagctgtcgc
      721 caatagcaac actggcagca gtaacagcgg atctatcaat aaggtagcac catcggccca
      781 acagttgccc atcatgggca gcggcctggc ggcacagtca acgggtgcag gaggccatgg
      841 atcagcgacg gggtcgggga caacatcccg acccgtatca gcgatgggcg gaacggtttc
      901 atcgacggcc ggcggcggcg gtgcaccgtc cataccaccg attagcacaa tgcctccgca
      961 cacagtcccc ggcagcacca acaccacgac gacggccacg acaatggtcg acgccattat
     1021 agccagcctt cggaatccca gccaggccgc atatccgggc gctacccagg cggcggctaa
     1081 cagctcctcc ctactggacg gcagcagcag tgcggcagca tcggcggcgg caacaacagc
     1141 agcggcgacg gcagcagcag cggcagcagc agcagcagcg gcggcggcag cagcagcatc
     1201 atcatctggc ggtggagcgg gagctcccgg tacagtcagt acggcgggtg gtgtgacaat
     1261 accatccgtc aataccacca ccaatgtgca ctcctcctac gtgaacagca cggcgggcgt
     1321 cggagttggt gtggatgcgg ttataccgcc ccaacagccg gcgaaaatga agaagggtgt
     1381 caaacggaag gcggacacaa cgacgccgac ggccaatgca tttgagtcgc cctacgccca
     1441 aatggactcc aagtcggcca agatagcgac gcgaagggaa tcgaatcgtc aggtaaaggg
     1501 caaaaaggat cttacattcc agggctcggg atatgcgatg tcgccatcga tgggtgtcgt
     1561 gcctggattg gcggcgggtg tggccgctag tgtggcggcg gccaagtcaa aggagaagct
     1621 gtcggatgca ctaaagtcat gcaacgagat cctcaaggag ctgttcagca agaagcactc
     1681 gggctatgcc tggcccttct acaagccggt ggatgcggaa atgctgggcc tccatgacta
     1741 ccacgacatc atcaaaaagc ccatggacct gggcaccgtc aagcggaaaa tggacaatcg
     1801 ggagtacaag agcgcaccgg agtttgcggc cgatgtgcga ttaatattca ccaactgcta
     1861 caagtacaat ccgccagatc atgatgttgt ggccatgggc cggaagctgc aagacgtctt
     1921 cgaaatgcgc tacgccaaca tacccgacga accggtctct aatgcggccc atcatcatgc
     1981 acatacgcac ggacatgggc acggccatgg acacggccag agtcacggtc acgggcatgg
     2041 gcatgggcac ggtggctatt cgagtgcttc cctcaagcac gatggcagcg actcgtccag
     2101 cgaggactcc agcggcacag agaacgagtc gaactcggac gaggagcgca gcgccaagct
     2161 gaaaatgctc gagtccaagc tgctcggtct ccaggaggag atccgaaagc tctccgagga
     2221 ggcctccgca aagaagaagg ccaagaaaaa actcaaagag aagaagaaga gcatcggtgg
     2281 gggctctggt tccggctcgg cctctcatca tgcccatgcc tcggctggtg gtggcgcagg
     2341 tggtccgtcc gccagccatg gtggcgtctc tgttccggcc agcgtcgttg ccctatcggc
     2401 gggcggagca gcgggaccca acctatcggc cttactcagc ggttcgctgg tgggcgcgag
     2461 cggagcgggc ggcggagtgc ccaacgtctc ggcccttcat tcactcgccc acgacatgac
     2521 ccttgccatg aaccaactga cgggcaatgc ggcagcgacc ggagctggct ttacggccgg
     2581 cataccgcca ccgggaccag cgccaggcgg caagggggcc aacatggcca gcgccatggc
     2641 tgcggcggga gcgggaccag gggcttctgg gggaaccggc ggcagcagca aatcgaagag
     2701 caagggccag cgcggtaaag gaagctcgag caatgcggga gcgggcggag catcctctgg
     2761 agtgacggtc aacgcgggca gcggaatcgg cggtgctggc gcagcgtcca gcgctggcag
     2821 tggcggtggc agtgggacta ctggccccag cggcaattcc tcaaagcggg gcaagggtag
     2881 tagtagtgcc ggcggtggtg gtggcggcag cagtggcagt gcggccaata ccaccagtgc
     2941 gaccggtgcc ggagcgcgcg gtagcagcaa gaagaagccc agccaggtga tgaactttga
     3001 ctccgaggag gaggacacgg ccaagcccat gtcgtacgat gagaagcgac aactctcact
     3061 ggacatcaac aagttgccag gcgacaagct ggggcgagtg gtgcacatta tccagaatcg
     3121 ggagccatcg ctgcgggact ccaatccgga cgagatagag atcgactttg agacgctgaa
     3181 gccgtcgacg ctgcgcgagc ttgaaagcta tgtggcgtcg tgtttgcgca aaaaaacacg
     3241 taagccatgt tataaaaagc cttccggcaa atcgaaggat gagcaaatgg cggaaaagaa
     3301 gcaggagctg gagaagcggc tgcaggacgt caccggccag ctgggtgcaa gcaagaaaaa
     3361 cgccaagaaa gatgattcca cctcaaacaa agtggaagct gtgcagccag cgaatcccgt
     3421 gtcgtcgagt tccagttcca gcgattcatc gtcctcgagt tcgagtgata gcagttcgag
     3481 tgactcgagc gacagtgaag caggttagga cgcgttttgt ttgtttgttt taccttataa
     3541 cgcctttttt ttttgttagt ttatatagac atatatacgt atgcatatat atatatatat
     3601 atatatatat atataaatat gaatatatat gtatagaaac gtttttaagc agcaaataac
     3661 aaaatcgaac agatcgacga cagtaaccga cagtaactta cagcttacga aactaaaagc
     3721 gtgcggtaga ggaagaggaa tagcaaagca ggtag