PREDICTED: Drosophila obscura TATA element modulatory factor


LOCUS       XM_022367793            3278 bp    mRNA    linear   INV 14-MAY-2021
            (LOC111074831), transcript variant X2, mRNA.
ACCESSION   XM_022367793
VERSION     XM_022367793.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022367793.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..3278
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..3278
                     /gene="LOC111074831"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 2 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 17 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111074831"
     CDS             141..3110
                     /gene="LOC111074831"
                     /codon_start=1
                     /product="TATA element modulatory factor"
                     /protein_id="XP_022223485.2"
                     /db_xref="GeneID:111074831"
                     /translation="MSWFEKAKTVLIEALDIQDDDRDKAAEKDGVTAGSGGGGGSGGS
                     SDTGATSSGAALVSQTTSSDTPTFFDNPHANEMVTIPPRASDPAVTTPTPTSTSAAMG
                     MGNPYAKRHSATSDSVDLLSSPSPTSPEGDAASAMENSESSLELITATTASEMEMSPD
                     TEPSLPGSIVIIASNETSDNAEGDGEDDDDDDDGTQLERHLEDHLNDSTKTMKALVFS
                     DTQAAANVTGADSDSTQSFEDIQMQMSHKDKAGGKGQGQDGEGEAKAEVVDQSYSSTS
                     SDIEIISNPNGDSSTNSTTTRTSPQKFKELGSSSSRSGAGTGTGLTGQVLKPKGHHRE
                     PSEISLLSEDSQSELDKLVNRISELNQVIEAREQRLLQSERQNAELLERNQELRASVE
                     AAANSANSPDAAEAVQRLSALEKKFQTSIRERDALRIQIKSLKDELLNKIPKDELAEC
                     NEMIAALQSEGEKLSKEILQQSIIIKKLRAKEKTSDTLLKKNGEQISLLSSESERLKK
                     SLAAKEEMERTQIEAVGRMTHEKRRVDEENADCRSRVEDLQSKLSALQSSFDGVRGDL
                     VKRTRVEQDSLRAENQEYVQQLGDMREKLRHAEHSLAKREQQLREENRQLLRRLEAAE
                     LRAESSTQELSVTTTPLIRQIESLQKTLNQRTASWNKEEQLLIQRADDAQLQLRSVQQ
                     LESVQNEKQELLRTRCSLLEAKLSSALAEVESARMALSQLEHDASLKESSHSRKLATL
                     QEQLQAHQERIVGLEEQQQCQQRQQQQKADAEAERETLQRQPMPSLLTVEAVKASSEM
                     QPHKSPVHSPHSALRQHSPPLSLADESGSTEDAMMGGIIDWQTDDLDCASNSGRNQSG
                     IIQGVHLSFMAGNTTTLEHLQSLLKQRDGELTHLQWELSRLQAERGVLDGEISHLTIE
                     LETMKEKMQSYEAMEKCYEDLQHRYDALLQMYGEKVERTEELELDLVELKSAYKLQID
                     ELLANPPPNLQRPAKHT"
     misc_feature    <1149..>2483
                     /gene="LOC111074831"
                     /note="Chromosome segregation ATPase Smc [Cell cycle
                     control, cell division, chromosome partitioning]; Region:
                     Smc; COG1196"
                     /db_xref="CDD:440809"
     misc_feature    2721..3062
                     /gene="LOC111074831"
                     /note="TATA element modulatory factor 1 TATA binding;
                     Region: TMF_TATA_bd; pfam12325"
                     /db_xref="CDD:432481"
ORIGIN      
        1 cgccatcgat agttgagggt ccgtatgagc tggaaataca atttttttgt attatgtgtt
       61 attgaaatca actaattgtg cgagaaaaca attgggattt gcatgtgctt gttgcagttc
      121 agaatcaggc acgcagcgag atgagttggt tcgagaaggc caagacggtg ctcatcgagg
      181 ccctcgacat ccaggatgac gacagggaca aggccgccga gaaggatggc gttactgcgg
      241 ggtcgggcgg tggcggtgga agcggaggat catcggacac gggcgccacg agctctggcg
      301 ccgcactcgt ctcgcagacg acatcctcgg acacgcctac attcttcgac aatccacacg
      361 ccaacgagat ggtaaccatt ccacccagag ccagcgatcc ggccgtaacc acgcccacac
      421 ccacatccac atccgcagca atgggcatgg gtaatccgta tgccaagcga cattcagcca
      481 catcggactc cgtcgatctg ctctcctcgc catcgcccac atcgcccgag ggcgacgccg
      541 cctccgcgat ggagaactct gaatcttcgc tggagctaat cacggccacg acggccagcg
      601 agatggagat gtcgccggac acggagccct cgctgcccgg cagcatcgtg atcatagcca
      661 gcaacgagac ctccgacaat gccgaaggcg atggcgaaga cgacgacgac gatgacgatg
      721 gcacccagct ggagcggcac ctggaggacc atctaaatga ttccacaaag accatgaaag
      781 ccctggtgtt tagcgacacc caggcggccg ccaatgtgac gggcgccgat tcagactcca
      841 cgcagagctt cgaggacatc caaatgcaga tgagccacaa ggacaaggcc ggtggaaagg
      901 gacaaggaca agatggcgag ggcgaggcca aagcagaggt ggtcgaccag agctactcgt
      961 ccacctcctc ggacattgag atcatttcca atccgaacgg ggactccagc accaacagca
     1021 caacgacgcg cacgagtccg caaaagttca aggagctggg cagcagcagc agccggtctg
     1081 gggctgggac aggcacaggg ctgactggac aggtgctcaa gcccaaggga caccatcgcg
     1141 agccctcaga gatatcgctg ctgtcggagg actcgcaatc ggagctggat aagctggtga
     1201 atcgcattag cgagctgaac caggtgattg aggcgcgcga gcagcgcttg ctgcagtcgg
     1261 agcgacagaa cgccgagctg ctggagcgca accaggagct tcgcgcctcc gtggaggcag
     1321 cggcgaacag cgccaacagt ccggatgccg cggaggccgt acagcggttg tcggcgctgg
     1381 agaagaagtt ccagacgagc atacgggagc gggacgcgct gcgcatccag atcaagagcc
     1441 tcaaggacga gctgctcaac aagataccca aggacgagct ggccgagtgc aacgagatga
     1501 tcgcagcgct gcagtcggag ggcgagaagc tctccaagga gattctccag cagtcgatca
     1561 tcatcaagaa gctgcgcgcc aaggagaaga cctcggacac gctcctcaag aaaaacggcg
     1621 agcagatctc gctgctgtcc agcgaatcgg agcggctcaa gaagtccctg gccgccaagg
     1681 aggaaatgga gcgcacgcag atcgaggcgg tgggccgaat gacccacgag aagcgacgcg
     1741 tcgatgagga gaacgccgac tgccgcagtc gtgtcgagga tctgcagtcg aaactgtcgg
     1801 cccttcagtc cagctttgac ggcgtccggg gcgatctggt taagcggacg cgcgtggagc
     1861 aggacagcct cagggccgag aatcaggagt acgtccagca gctgggcgac atgcgggaga
     1921 agctgcgcca cgccgagcac agtctggcca agcgggagca gcagctgcgg gaggagaacc
     1981 gccagctgct gcgacgcttg gaggctgccg aactgcgagc ggagagctcc acgcaggagc
     2041 tgagcgtcac caccaccccg ctgatccgcc agatcgagtc gctgcagaag accctcaacc
     2101 agcgcaccgc ctcctggaac aaggaggagc agctgctgat ccagagggcc gacgatgccc
     2161 agctgcagct gcgctcggtg cagcagctcg agtcggtgca gaacgagaag caggagctgc
     2221 tgcgcacgcg gtgcagcctt ctcgaggcga agctctccag cgctctggcg gaggtggaga
     2281 gtgccaggat ggccctcagc cagctggagc acgatgccag cctcaaggag agctcacaca
     2341 gcagaaagtt ggccacgctg caggagcagc tgcaggcgca tcaggagagg attgtgggcc
     2401 tagaggagca gcagcagtgc cagcagcgcc agcaacagca gaaggccgat gccgaggctg
     2461 agcgggaaac cttgcagcga cagcccatgc ccagcctgct taccgtagag gccgtcaagg
     2521 ccagcagtga aatgcagccg cataaatctc cggttcattc cccacactct gcgctgcgcc
     2581 agcactcgcc tccgctcagt ctggccgatg agagcggctc cacggaggat gcgatgatgg
     2641 gcggcatcat tgactggcag acggacgacc tggactgtgc ctccaactcg ggccgcaacc
     2701 agtcgggcat catccagggc gtccacctga gcttcatggc gggcaacacc acaacgctgg
     2761 agcatctgca gtcgctgctg aagcagcgtg acggcgagct cacacacctc caatgggagc
     2821 tgtcgcgcct gcaggccgag cgcggtgtgc tcgacggaga gatatcccat ttgacgattg
     2881 aactggagac gatgaaggag aaaatgcagt catacgaggc catggagaag tgctacgagg
     2941 acctgcagca tcgctacgat gccctgctcc agatgtacgg cgagaaggtg gagcgcaccg
     3001 aggagctgga actggatctg gtcgaactga agtccgccta caagctgcag atcgacgagc
     3061 tgctggccaa tccacccccg aacctgcaga ggccagcgaa gcacacatga ttgccggaac
     3121 gcagaagcat ctactgtgtc tcgctgccca atctgacatg cctgcggcga tcctagtccc
     3181 gtttcccact accaattacc attcccgatg ggccattatc cttatcctac catactctgg
     3241 ctaacgtcgg gggaatgaga gcagcgcagg gcagggca