PREDICTED: Drosophila obscura homeotic protein female sterile


LOCUS       XM_041591944            3740 bp    mRNA    linear   INV 14-MAY-2021
DEFINITION  PREDICTED: Drosophila obscura homeotic protein female sterile
            (LOC111072429), transcript variant X4, mRNA.
ACCESSION   XM_041591944
VERSION     XM_041591944.1
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..3740
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..3740
                     /gene="LOC111072429"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 9 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 17 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111072429"
     CDS             170..3493
                     /gene="LOC111072429"
                     /codon_start=1
                     /product="homeotic protein female sterile isoform X4"
                     /protein_id="XP_041447878.1"
                     /db_xref="GeneID:111072429"
                     /translation="MSSNEPPPRYEPPVEPVNGIVQPAVVPPVDRPGRNTNQLQFLIK
                     TVMKMIWKHHFAWPFQQPVDAKKLNLPDYHKIIKQPMDMGTIKKRLENNYYWSAKETI
                     HDFNTMFNNCYVYNKPGEDVVVMAQTLEKVFLQKIETMPKEELELEPATAKGGKKKAR
                     APATPKSGSGGGGGTGSSTGAAVANSNTGSSNSGSINKVAPSAQQLPIMGSGLAAQST
                     GAGGHGSATGSGTTSRPVSAMGGTVSSTAGGGGAPSIPPISTMPPHTVPGSTNTTTTA
                     TTMVDAIIASLRNPSQAAYPGATQAAANSSSLLDGSSSAAASAAATTAAATAAAAAAA
                     AAAAAAAAASSSGGGAGAPGTVSTAGGVTIPSVNTTTNVHSSYVNSTAGVGVGVDAVI
                     PPQQPAKMKKGVKRKADTTTPTANAFESPYAQMDSKSAKIATRRESNRQDLTFQGSGY
                     AMSPSMGVVPGLAAGVAASVAAAKSKEKLSDALKSCNEILKELFSKKHSGYAWPFYKP
                     VDAEMLGLHDYHDIIKKPMDLGTVKRKMDNREYKSAPEFAADVRLIFTNCYKYNPPDH
                     DVVAMGRKLQDVFEMRYANIPDEPVSNAAHHHAHTHGHGHGHGHGQSHGHGHGHGHGG
                     YSSASLKHDGSDSSSEDSSGTENESNSDEERSAKLKMLESKLLGLQEEIRKLSEEASA
                     KKKAKKKLKEKKKSIGGGSGSGSASHHAHASAGGGAGGPSASHGGVSVPASVVALSAG
                     GAAGPNLSALLSGSLVGASGAGGGVPNVSALHSLAHDMTLAMNQLTGNAAATGAGFTA
                     GIPPPGPAPGGKGANMASAMAAAGAGPGASGGTGGSSKSKSKGQRGKGSSSNAGAGGA
                     SSGVTVNAGSGIGGAGAASSAGSGGGSGTTGPSGNSSKRGKGSSSAGGGGGGSSGSAA
                     NTTSATGAGARGSSKKKPSQVMNFDSEEEDTAKPMSYDEKRQLSLDINKLPGDKLGRV
                     VHIIQNREPSLRDSNPDEIEIDFETLKPSTLRELESYVASCLRKKTRKPCYKKPSGKS
                     KDEQMAEKKQELEKRLQDVTGQLGASKKNAKKDDSTSNKVEAVQPANPVSSSSSSSDS
                     SSSSSSDSSSSDSSDSEAG"
     misc_feature    269..589
                     /gene="LOC111072429"
                     /note="Bromodomain, Brdt_like subfamily, repeat I. Human
                     Brdt is a testis-specific member of the BET subfamily of
                     bromodomain proteins; the first bromodomain in Brdt has
                     been shown to be essential for male germ cell
                     differentiation. Bromodomains are 110 amino...; Region:
                     Bromo_Brdt_I_like; cd05497"
                     /db_xref="CDD:99929"
     misc_feature    order(356..358,377..379,386..388,503..505,515..517,
                     533..535)
                     /gene="LOC111072429"
                     /note="acetyllysine binding site [active]"
                     /db_xref="CDD:99929"
     misc_feature    1616..1918
                     /gene="LOC111072429"
                     /note="Bromodomain, Brdt_like subfamily, repeat II. Human
                     Brdt is a testis-specific member of the BET subfamily of
                     bromodomain proteins; the first bromodomain in Brdt has
                     been shown to be essential for male germ cell
                     differentiation. Bromodomains are 110 amino...; Region:
                     Bromo_Brdt_II_like; cd05498"
                     /db_xref="CDD:99930"
     misc_feature    order(1694..1696,1715..1717,1724..1726,1841..1843,
                     1853..1855,1871..1873)
                     /gene="LOC111072429"
                     /note="acetyllysine binding site [active]"
                     /db_xref="CDD:99930"
     misc_feature    3011..3205
                     /gene="LOC111072429"
                     /note="Bromodomain extra-terminal - transcription
                     regulation; Region: BET; pfam17035"
                     /db_xref="CDD:435704"
ORIGIN      
        1 agcagcagca gcagtacaac cagcatccac ttgaggatca gataccttaa aagcaaccgc
       61 aacaggagca gggacaaaag caacaaccag aagcctcatc atcagccaac aggaggagca
      121 gcagtagccg cagcaccact gtgtcaccat catcaccatc atcaacaaca tgtcgtccaa
      181 cgaaccacca cctcgctacg agccgcctgt ggagccggtc aatggcattg tgcagccagc
      241 ggttgtgcct ccagttgatc gacccggccg caatacaaat caattgcaat tcttgatcaa
      301 aaccgtaatg aagatgatat ggaaacacca ttttgcgtgg cccttccagc agcccgtcga
      361 cgcgaaaaag ctcaacctgc ccgactacca caagatcatc aagcagccga tggacatggg
      421 aacgatcaag aagcgactgg agaacaacta ttactggtcg gcgaaggaga ccatccatga
      481 cttcaatacc atgttcaaca actgctatgt ctacaacaag cccggcgagg atgtggtcgt
      541 gatggcccag acgctggaga aggtattctt gcagaagatc gagacgatgc ccaaggagga
      601 gcttgaactg gagccggcca cggccaaggg tggcaagaag aaggcacgtg ccccggccac
      661 gcccaagtct ggatcaggag gcggaggtgg aacgggatca agcacgggtg cagctgtcgc
      721 caatagcaac actggcagca gtaacagcgg atctatcaat aaggtagcac catcggccca
      781 acagttgccc atcatgggca gcggcctggc ggcacagtca acgggtgcag gaggccatgg
      841 atcagcgacg gggtcgggga caacatcccg acccgtatca gcgatgggcg gaacggtttc
      901 atcgacggcc ggcggcggcg gtgcaccgtc cataccaccg attagcacaa tgcctccgca
      961 cacagtcccc ggcagcacca acaccacgac gacggccacg acaatggtcg acgccattat
     1021 agccagcctt cggaatccca gccaggccgc atatccgggc gctacccagg cggcggctaa
     1081 cagctcctcc ctactggacg gcagcagcag tgcggcagca tcggcggcgg caacaacagc
     1141 agcggcgacg gcagcagcag cggcagcagc agcagcagcg gcggcggcag cagcagcatc
     1201 atcatctggc ggtggagcgg gagctcccgg tacagtcagt acggcgggtg gtgtgacaat
     1261 accatccgtc aataccacca ccaatgtgca ctcctcctac gtgaacagca cggcgggcgt
     1321 cggagttggt gtggatgcgg ttataccgcc ccaacagccg gcgaaaatga agaagggtgt
     1381 caaacggaag gcggacacaa cgacgccgac ggccaatgca tttgagtcgc cctacgccca
     1441 aatggactcc aagtcggcca agatagcgac gcgaagggaa tcgaatcgtc aggatcttac
     1501 attccagggc tcgggatatg cgatgtcgcc atcgatgggt gtcgtgcctg gattggcggc
     1561 gggtgtggcc gctagtgtgg cggcggccaa gtcaaaggag aagctgtcgg atgcactaaa
     1621 gtcatgcaac gagatcctca aggagctgtt cagcaagaag cactcgggct atgcctggcc
     1681 cttctacaag ccggtggatg cggaaatgct gggcctccat gactaccacg acatcatcaa
     1741 aaagcccatg gacctgggca ccgtcaagcg gaaaatggac aatcgggagt acaagagcgc
     1801 accggagttt gcggccgatg tgcgattaat attcaccaac tgctacaagt acaatccgcc
     1861 agatcatgat gttgtggcca tgggccggaa gctgcaagac gtcttcgaaa tgcgctacgc
     1921 caacataccc gacgaaccgg tctctaatgc ggcccatcat catgcacata cgcacggaca
     1981 tgggcacggc catggacacg gccagagtca cggtcacggg catgggcatg ggcacggtgg
     2041 ctattcgagt gcttccctca agcacgatgg cagcgactcg tccagcgagg actccagcgg
     2101 cacagagaac gagtcgaact cggacgagga gcgcagcgcc aagctgaaaa tgctcgagtc
     2161 caagctgctc ggtctccagg aggagatccg aaagctctcc gaggaggcct ccgcaaagaa
     2221 gaaggccaag aaaaaactca aagagaagaa gaagagcatc ggtgggggct ctggttccgg
     2281 ctcggcctct catcatgccc atgcctcggc tggtggtggc gcaggtggtc cgtccgccag
     2341 ccatggtggc gtctctgttc cggccagcgt cgttgcccta tcggcgggcg gagcagcggg
     2401 acccaaccta tcggccttac tcagcggttc gctggtgggc gcgagcggag cgggcggcgg
     2461 agtgcccaac gtctcggccc ttcattcact cgcccacgac atgacccttg ccatgaacca
     2521 actgacgggc aatgcggcag cgaccggagc tggctttacg gccggcatac cgccaccggg
     2581 accagcgcca ggcggcaagg gggccaacat ggccagcgcc atggctgcgg cgggagcggg
     2641 accaggggct tctgggggaa ccggcggcag cagcaaatcg aagagcaagg gccagcgcgg
     2701 taaaggaagc tcgagcaatg cgggagcggg cggagcatcc tctggagtga cggtcaacgc
     2761 gggcagcgga atcggcggtg ctggcgcagc gtccagcgct ggcagtggcg gtggcagtgg
     2821 gactactggc cccagcggca attcctcaaa gcggggcaag ggtagtagta gtgccggcgg
     2881 tggtggtggc ggcagcagtg gcagtgcggc caataccacc agtgcgaccg gtgccggagc
     2941 gcgcggtagc agcaagaaga agcccagcca ggtgatgaac tttgactccg aggaggagga
     3001 cacggccaag cccatgtcgt acgatgagaa gcgacaactc tcactggaca tcaacaagtt
     3061 gccaggcgac aagctggggc gagtggtgca cattatccag aatcgggagc catcgctgcg
     3121 ggactccaat ccggacgaga tagagatcga ctttgagacg ctgaagccgt cgacgctgcg
     3181 cgagcttgaa agctatgtgg cgtcgtgttt gcgcaaaaaa acacgtaagc catgttataa
     3241 aaagccttcc ggcaaatcga aggatgagca aatggcggaa aagaagcagg agctggagaa
     3301 gcggctgcag gacgtcaccg gccagctggg tgcaagcaag aaaaacgcca agaaagatga
     3361 ttccacctca aacaaagtgg aagctgtgca gccagcgaat cccgtgtcgt cgagttccag
     3421 ttccagcgat tcatcgtcct cgagttcgag tgatagcagt tcgagtgact cgagcgacag
     3481 tgaagcaggt taggacgcgt tttgtttgtt tgttttacct tataacgcct tttttttttg
     3541 ttagtttata tagacatata tacgtatgca tatatatata tatatatata tatatatata
     3601 aatatgaata tatatgtata gaaacgtttt taagcagcaa ataacaaaat cgaacagatc
     3661 gacgacagta accgacagta acttacagct tacgaaacta aaagcgtgcg gtagaggaag
     3721 aggaatagca aagcaggtag