PREDICTED: Drosophila obscura homeotic protein female sterile


LOCUS       XM_041591941            6245 bp    mRNA    linear   INV 14-MAY-2021
            (LOC111072429), transcript variant X1, mRNA.
ACCESSION   XM_041591941
VERSION     XM_041591941.1
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..6245
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..6245
                     /gene="LOC111072429"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 11 Proteins, and 99% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 17 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111072429"
     CDS             170..6091
                     /gene="LOC111072429"
                     /codon_start=1
                     /product="homeotic protein female sterile isoform X1"
                     /protein_id="XP_041447875.1"
                     /db_xref="GeneID:111072429"
                     /translation="MSSNEPPPRYEPPVEPVNGIVQPAVVPPVDRPGRNTNQLQFLIK
                     TVMKMIWKHHFAWPFQQPVDAKKLNLPDYHKIIKQPMDMGTIKKRLENNYYWSAKETI
                     HDFNTMFNNCYVYNKPGEDVVVMAQTLEKVFLQKIETMPKEELELEPATAKGGKKKAR
                     APATPKSGSGGGGGTGSSTGAAVANSNTGSSNSGSINKVAPSAQQLPIMGSGLAAQST
                     GAGGHGSATGSGTTSRPVSAMGGTVSSTAGGGGAPSIPPISTMPPHTVPGSTNTTTTA
                     TTMVDAIIASLRNPSQAAYPGATQAAANSSSLLDGSSSAAASAAATTAAATAAAAAAA
                     AAAAAAAAASSSGGGAGAPGTVSTAGGVTIPSVNTTTNVHSSYVNSTAGVGVGVDAVI
                     PPQQPAKMKKGVKRKADTTTPTANAFESPYAQMDSKSAKIATRRESNRQDLTFQGSGY
                     AMSPSMGVVPGLAAGVAASVAAAKSKEKLSDALKSCNEILKELFSKKHSGYAWPFYKP
                     VDAEMLGLHDYHDIIKKPMDLGTVKRKMDNREYKSAPEFAADVRLIFTNCYKYNPPDH
                     DVVAMGRKLQDVFEMRYANIPDEPVSNAAHHHAHTHGHGHGHGHGQSHGHGHGHGHGG
                     YSSASLKHDGSDSSSEDSSGTENESNSDEERSAKLKMLESKLLGLQEEIRKLSEEASA
                     KKKAKKKLKEKKKSIGGGSGSGSASHHAHASAGGGAGGPSASHGGVSVPASVVALSAG
                     GAAGPNLSALLSGSLVGASGAGGGVPNVSALHSLAHDMTLAMNQLTGNAAATGAGFTA
                     GIPPPGPAPGGKGANMASAMAAAGAGPGASGGTGGSSKSKSKGQRGKGSSSNAGAGGA
                     SSGVTVNAGSGIGGAGAASSAGSGGGSGTTGPSGNSSKRGKGSSSAGGGGGGSSGSAA
                     NTTSATGAGARGSSKKKPSQVMNFDSEEEDTAKPMSYDEKRQLSLDINKLPGDKLGRV
                     VHIIQNREPSLRDSNPDEIEIDFETLKPSTLRELESYVASCLRKKTHKKPSGKSKDEQ
                     MAEKKQELEKRLQDVTGQLGASKKNAKKDDSTSNKVEAVQPANPVSSSSSSSDSSSSS
                     SSDSSSSDSSDSEAGDGDERPPRKKKPRDSNGSNVNNPSLSVVLGGTLPSGGLTPTLL
                     HMGLDHVLNANSPTSQMANLLGNPNPLTAAAMLNNNNKTTLQVGGSFGGASAGGNNSM
                     LHGQVGATAHHKNGQNDHLMTSKMPPGGGAAGAASLPPHSYAGSVPTQAASLGGGGIR
                     IASNLHKQPNLPGGDLVENNAALTAALTSTVNSNSGSGAGVGVAAGLSNTSSGTASGH
                     THNTNTMGGQGDGLPGASLASGLKQIPQFDDPVEQSLASLEFSAAAASTGKSGLTDNF
                     LMAQQGHLMQQPGLQQQPPFGHHQQQQQQQQQQQHHPMDYMTELLTKGTENVPGMNGN
                     LLNFNLDMAAAAAYQQKQHHGQHTQQQQQQQQQQQQQQQQQQASHNNGFNVADFGMPG
                     FDNLTATAFLDLEHTLQQQHMQLQQQQQQQQQHHHQQQSLQQLHAHQQQLANKMLLIK
                     PIESMMPSPPDKLKVMLKVSQSPSDLKLHSSQAAAAQSMLAQSFKAAEQNLKNASSWS
                     SLASASSPQNTSSSSSSSKPKPAMDSFQQFRNKAKERDRLKLLEAAEKEKKHQKEAAE
                     KEQQRKHHKSSSSSSAAQAVQAAAAAAAVAAAAAAAAAAAASSTNISTGNAPQSGAGQ
                     ISSDRERSSSAVDATRMGSGGGGNGGLLLPGNGNNSSNSANSNGPGSAGSGSGGPVSG
                     GLASGGGPNSGGCIIGPLANTGSNSNSGVGSGATSSNSNSSVGGVVGSGGPGSNSQGS
                     SGGGGTMGSGLLEYGPQVVVLTQAAANAQAQHVSTTMTAQTVLASSPLEAMESGRKSV
                     HDTQSQISRVEDIKASPGQGQSSPAQQSPQDRAAAKRAEQRRAEQERRRREALAGQID
                     MNMQSDLMAAFEETL"
     misc_feature    269..589
                     /gene="LOC111072429"
                     /note="Bromodomain, Brdt_like subfamily, repeat I. Human
                     Brdt is a testis-specific member of the BET subfamily of
                     bromodomain proteins; the first bromodomain in Brdt has
                     been shown to be essential for male germ cell
                     differentiation. Bromodomains are 110 amino...; Region:
                     Bromo_Brdt_I_like; cd05497"
                     /db_xref="CDD:99929"
     misc_feature    order(356..358,377..379,386..388,503..505,515..517,
                     533..535)
                     /gene="LOC111072429"
                     /note="acetyllysine binding site [active]"
                     /db_xref="CDD:99929"
     misc_feature    1616..1918
                     /gene="LOC111072429"
                     /note="Bromodomain, Brdt_like subfamily, repeat II. Human
                     Brdt is a testis-specific member of the BET subfamily of
                     bromodomain proteins; the first bromodomain in Brdt has
                     been shown to be essential for male germ cell
                     differentiation. Bromodomains are 110 amino...; Region:
                     Bromo_Brdt_II_like; cd05498"
                     /db_xref="CDD:99930"
     misc_feature    order(1694..1696,1715..1717,1724..1726,1841..1843,
                     1853..1855,1871..1873)
                     /gene="LOC111072429"
                     /note="acetyllysine binding site [active]"
                     /db_xref="CDD:99930"
     misc_feature    3011..3205
                     /gene="LOC111072429"
                     /note="Bromodomain extra-terminal - transcription
                     regulation; Region: BET; pfam17035"
                     /db_xref="CDD:435704"
     misc_feature    <6026..6088
                     /gene="LOC111072429"
                     /note="C-terminal domain of bromodomain protein 4; Region:
                     BRD4_CDT; pfam17105"
                     /db_xref="CDD:465349"
ORIGIN      
        1 agcagcagca gcagtacaac cagcatccac ttgaggatca gataccttaa aagcaaccgc
       61 aacaggagca gggacaaaag caacaaccag aagcctcatc atcagccaac aggaggagca
      121 gcagtagccg cagcaccact gtgtcaccat catcaccatc atcaacaaca tgtcgtccaa
      181 cgaaccacca cctcgctacg agccgcctgt ggagccggtc aatggcattg tgcagccagc
      241 ggttgtgcct ccagttgatc gacccggccg caatacaaat caattgcaat tcttgatcaa
      301 aaccgtaatg aagatgatat ggaaacacca ttttgcgtgg cccttccagc agcccgtcga
      361 cgcgaaaaag ctcaacctgc ccgactacca caagatcatc aagcagccga tggacatggg
      421 aacgatcaag aagcgactgg agaacaacta ttactggtcg gcgaaggaga ccatccatga
      481 cttcaatacc atgttcaaca actgctatgt ctacaacaag cccggcgagg atgtggtcgt
      541 gatggcccag acgctggaga aggtattctt gcagaagatc gagacgatgc ccaaggagga
      601 gcttgaactg gagccggcca cggccaaggg tggcaagaag aaggcacgtg ccccggccac
      661 gcccaagtct ggatcaggag gcggaggtgg aacgggatca agcacgggtg cagctgtcgc
      721 caatagcaac actggcagca gtaacagcgg atctatcaat aaggtagcac catcggccca
      781 acagttgccc atcatgggca gcggcctggc ggcacagtca acgggtgcag gaggccatgg
      841 atcagcgacg gggtcgggga caacatcccg acccgtatca gcgatgggcg gaacggtttc
      901 atcgacggcc ggcggcggcg gtgcaccgtc cataccaccg attagcacaa tgcctccgca
      961 cacagtcccc ggcagcacca acaccacgac gacggccacg acaatggtcg acgccattat
     1021 agccagcctt cggaatccca gccaggccgc atatccgggc gctacccagg cggcggctaa
     1081 cagctcctcc ctactggacg gcagcagcag tgcggcagca tcggcggcgg caacaacagc
     1141 agcggcgacg gcagcagcag cggcagcagc agcagcagcg gcggcggcag cagcagcatc
     1201 atcatctggc ggtggagcgg gagctcccgg tacagtcagt acggcgggtg gtgtgacaat
     1261 accatccgtc aataccacca ccaatgtgca ctcctcctac gtgaacagca cggcgggcgt
     1321 cggagttggt gtggatgcgg ttataccgcc ccaacagccg gcgaaaatga agaagggtgt
     1381 caaacggaag gcggacacaa cgacgccgac ggccaatgca tttgagtcgc cctacgccca
     1441 aatggactcc aagtcggcca agatagcgac gcgaagggaa tcgaatcgtc aggatcttac
     1501 attccagggc tcgggatatg cgatgtcgcc atcgatgggt gtcgtgcctg gattggcggc
     1561 gggtgtggcc gctagtgtgg cggcggccaa gtcaaaggag aagctgtcgg atgcactaaa
     1621 gtcatgcaac gagatcctca aggagctgtt cagcaagaag cactcgggct atgcctggcc
     1681 cttctacaag ccggtggatg cggaaatgct gggcctccat gactaccacg acatcatcaa
     1741 aaagcccatg gacctgggca ccgtcaagcg gaaaatggac aatcgggagt acaagagcgc
     1801 accggagttt gcggccgatg tgcgattaat attcaccaac tgctacaagt acaatccgcc
     1861 agatcatgat gttgtggcca tgggccggaa gctgcaagac gtcttcgaaa tgcgctacgc
     1921 caacataccc gacgaaccgg tctctaatgc ggcccatcat catgcacata cgcacggaca
     1981 tgggcacggc catggacacg gccagagtca cggtcacggg catgggcatg ggcacggtgg
     2041 ctattcgagt gcttccctca agcacgatgg cagcgactcg tccagcgagg actccagcgg
     2101 cacagagaac gagtcgaact cggacgagga gcgcagcgcc aagctgaaaa tgctcgagtc
     2161 caagctgctc ggtctccagg aggagatccg aaagctctcc gaggaggcct ccgcaaagaa
     2221 gaaggccaag aaaaaactca aagagaagaa gaagagcatc ggtgggggct ctggttccgg
     2281 ctcggcctct catcatgccc atgcctcggc tggtggtggc gcaggtggtc cgtccgccag
     2341 ccatggtggc gtctctgttc cggccagcgt cgttgcccta tcggcgggcg gagcagcggg
     2401 acccaaccta tcggccttac tcagcggttc gctggtgggc gcgagcggag cgggcggcgg
     2461 agtgcccaac gtctcggccc ttcattcact cgcccacgac atgacccttg ccatgaacca
     2521 actgacgggc aatgcggcag cgaccggagc tggctttacg gccggcatac cgccaccggg
     2581 accagcgcca ggcggcaagg gggccaacat ggccagcgcc atggctgcgg cgggagcggg
     2641 accaggggct tctgggggaa ccggcggcag cagcaaatcg aagagcaagg gccagcgcgg
     2701 taaaggaagc tcgagcaatg cgggagcggg cggagcatcc tctggagtga cggtcaacgc
     2761 gggcagcgga atcggcggtg ctggcgcagc gtccagcgct ggcagtggcg gtggcagtgg
     2821 gactactggc cccagcggca attcctcaaa gcggggcaag ggtagtagta gtgccggcgg
     2881 tggtggtggc ggcagcagtg gcagtgcggc caataccacc agtgcgaccg gtgccggagc
     2941 gcgcggtagc agcaagaaga agcccagcca ggtgatgaac tttgactccg aggaggagga
     3001 cacggccaag cccatgtcgt acgatgagaa gcgacaactc tcactggaca tcaacaagtt
     3061 gccaggcgac aagctggggc gagtggtgca cattatccag aatcgggagc catcgctgcg
     3121 ggactccaat ccggacgaga tagagatcga ctttgagacg ctgaagccgt cgacgctgcg
     3181 cgagcttgaa agctatgtgg cgtcgtgttt gcgcaaaaaa acacataaaa agccttccgg
     3241 caaatcgaag gatgagcaaa tggcggaaaa gaagcaggag ctggagaagc ggctgcagga
     3301 cgtcaccggc cagctgggtg caagcaagaa aaacgccaag aaagatgatt ccacctcaaa
     3361 caaagtggaa gctgtgcagc cagcgaatcc cgtgtcgtcg agttccagtt ccagcgattc
     3421 atcgtcctcg agttcgagtg atagcagttc gagtgactcg agcgacagtg aagcaggtga
     3481 tggagacgaa cgacctccgc gcaaaaagaa gccacgcgac tcgaatggca gcaatgtaaa
     3541 taatcccagc ctcagcgttg ttttgggagg aaccctgccg agtggcggct tgacgccgac
     3601 gctccttcac atgggcctgg accacgtgct caacgcaaac tcacccacat cacaaatggc
     3661 caatctgttg ggcaatccga atcccttgac ggcggctgcc atgctgaaca ataacaacaa
     3721 gacgacgttg caggtcggcg gcagcttcgg cggcgcctcc gcgggcggca acaacagcat
     3781 gctgcacggc caggttggcg caacggcgca ccacaagaac ggacaaaacg accacctaat
     3841 gactagcaaa atgccgcctg gcggtggggc tgccggagcc gcttccctgc cgccccacag
     3901 ctatgccggt agcgtgccca cccaggccgc aagtctgggc ggagggggca tacggatagc
     3961 cagtaatctg cacaagcaac ccaatctgcc cggcggcgac ctggtcgaga ataacgcggc
     4021 gctgaccgct gctttgacgt cgaccgtcaa cagcaacagc ggcagcggcg ctggtgtggg
     4081 agtggccgcc ggcctgagca acaccagcag tggcaccgcc tcgggccaca cacacaacac
     4141 caacacaatg ggtggccagg gggatggctt gccgggtgcc tcgctggcat cgggcctcaa
     4201 gcaaatcccg cagttcgacg atcccgttga gcagtcgctg gcctccctgg agttcagtgc
     4261 ggcagcggcc tccacgggca agtcgggctt aaccgataac tttttgatgg cccagcaggg
     4321 acacctaatg cagcaacctg gtctgcagca gcagccgccc tttggacacc accaacagca
     4381 gcagcaacag cagcaacagc agcagcacca ccctatggac tacatgacgg aactgttgac
     4441 aaagggtaca gagaacgtgc ccggtatgaa cggaaacctt ttgaacttca acctcgacat
     4501 ggcggctgcg gcggcctacc aacagaagca gcaccatggc cagcacaccc agcagcagca
     4561 gcagcaacaa cagcagcagc agcagcaaca gcagcagcaa caggcgtcgc acaacaatgg
     4621 cttcaatgtg gcggactttg gcatgccagg attcgataat ctgactgcaa cagcattcct
     4681 cgacctggag cacacactcc agcagcagca catgcagctg caacagcagc agcagcaaca
     4741 gcaacaacac caccaccaac agcagtccct tcagcagctg catgcccacc agcagcagct
     4801 ggccaacaaa atgctcctca tcaaaccgat cgagtcgatg atgcccagtc cgccggacaa
     4861 gctgaaggta atgctgaagg tatcccaatc gccctccgac ctgaagctgc actcaagcca
     4921 ggcggcggcc gcccagagta tgctggctca atccttcaag gcggccgagc agaacctgaa
     4981 gaatgccagc tcgtggtcat cgctggcatc agccagctca ccgcagaaca cttcgagcag
     5041 ttcgagcagc agcaagccca agccggcgat ggactcattc cagcaattcc gcaacaaagc
     5101 caaagaacgc gaccgcctca agctgttgga ggcggccgag aaggagaaga agcatcaaaa
     5161 ggaggctgcc gagaaggagc agcagcgcaa gcatcacaag tcatcctcgt cctcatccgc
     5221 cgcacaggcg gtccaggctg ccgctgccgc tgcagcagtc gccgcagcag cagctgccgc
     5281 agcggcagcg gcagcctcct caacaaacat ctccaccgga aatgcgcctc agtctggggc
     5341 aggacagata agcagtgata gggaaaggtc cagcagcgct gtggatgcca cccgcatggg
     5401 cagcggtggg ggcggcaacg gcggtctact cctacccggc aatggcaaca acagcagcaa
     5461 ctctgccaac agcaacggac ccggcagcgc gggtagcggc agtgggggcc ccgtcagtgg
     5521 tggcctagcc agtggcggcg gacccaacag tggcggctgc atcatcggac cattggcaaa
     5581 tacaggcagc aacagcaaca gcggcgttgg cagcggggcc acaagcagca acagcaatag
     5641 cagtgtgggc ggagtggtcg ggagcggggg gcccggctca aatagccaag gcagtagcgg
     5701 tgggggcggg acgatgggaa gcggactcct agaatacggc ccgcaggtgg tggtcctcac
     5761 tcaggcggcg gcgaatgccc aggcccagca cgtatcgact acaatgacgg cgcagaccgt
     5821 cctggcttcc tcgcccctgg aggccatgga gagtggcagg aaaagcgtgc atgacaccca
     5881 gtcccagata tcgcgtgtcg aggacatcaa ggcatcgccc ggccagggcc agagttcgcc
     5941 ggcacagcaa tcgccgcaag atcgggcagc ggccaagcgt gcggagcaac gaagagcgga
     6001 gcaggagaga cgcagacgcg aagcgttggc tggccaaatc gacatgaaca tgcagagtga
     6061 tctaatggca gcgtttgagg agacgttgta ggacaaggcc ttcggaggac agcaacggac
     6121 atatacgcat cccagaacca gcatcctcat tgctgctccg agaatgccgt cgtcgctttc
     6181 aaagcggcgg gcggcgagga cgccaaagcc tctgccaaca cagacaacaa tggagagcag
     6241 cacca