PREDICTED: Drosophila obscura ubiquitin carboxyl-terminal hydrolase


LOCUS       XM_022367788            3762 bp    mRNA    linear   INV 14-MAY-2021
            16 (LOC111074830), mRNA.
ACCESSION   XM_022367788
VERSION     XM_022367788.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq; includes ab initio.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022367788.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
            
            ##RefSeq-Attributes-START##
            ab initio :: 3% of CDS bases
            ##RefSeq-Attributes-END##
FEATURES             Location/Qualifiers
     source          1..3762
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..3762
                     /gene="LOC111074830"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 4 Proteins, and 96% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 5 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111074830"
     CDS             22..3600
                     /gene="LOC111074830"
                     /codon_start=1
                     /product="ubiquitin carboxyl-terminal hydrolase 16"
                     /protein_id="XP_022223480.2"
                     /db_xref="GeneID:111074830"
                     /translation="MEATANGNIRKKRAKKGARAKQLLAMGKKRQMDNHDNASSTDSG
                     QEDSHGQTAGASGSASAAGAGSLGADSPMTNCCQHIKKSVDAARLRRQLKTTGLVYEC
                     SQCQKISQSAASGSGSGVDLACDFEIDSTLWLCLKCGTQLCGRSRKQHALQHYKTPHS
                     DSHALAMNTRSFEIWCYGCDNKVIPNSRKNLLECVELVKRLAQKPPADPPVEATVVAA
                     PSPPIITDIELKLKSALNRLKPIVPMTGGSFEDNNSTGRSGGKALTSNLTAIPLPSPP
                     GATASSPVPGMAKRIDSAAVGSNPNRPCSPRSELERLPRVRGLTNLGNTCFFNAVMQC
                     LAQTPFLLRVLRELAEPGEEFELPGGTFDFKDKGPTDLPIIRGTLSSWGGLTSALANA
                     LEELQVGGGVFTPSKLFDRLCAKCPQFTGGDQHDAHELLRQLLESVRNEDLKRYQRVI
                     LQNLGYKDEDIQSVSEEMRQKCKIYGNQAGDRILRPEQVFRGFLVSTLTCQDCHSVSS
                     RHEYFLDMSLPVAVEKPQPPQRRRPSPESSPFPIAGQTQTQTQNQSQSQSPTKINTKF
                     TTPEDSNPFSTACSSSSSFYLHANEQEPVGPSKSQVKKEKERERKAKRAAKHHRYKQA
                     QKLTLNLNGNGTGSQADESDAGTGRVTSSGGGDGDGQTTSDGQDPPKEDLMSSSSTTS
                     ENSDADVEDNLMDETASARDRTKPRGATGGSSSSPAQGGSNSSSSRRFFTDTNGNAQP
                     LGEKRDDTPENMDKDSLEEDENDSGIATSPLPSGISKTTTTTTANNNEASRGAEQQQP
                     QKDKKEEGQASADIVTAGVSEVGASTIRQISVELDLPTNGDVREEAGEANGDADANAT
                     LQLQEIAHQLAISEFTLEATAATAASATAEGVAAAAAAAGVAAAARAKRVRTYSYSDW
                     STTIAPRYQCEDGECSVQSCLNNFTAVELMTGQNKVGCESCTLRLNGNDTKAKSVNTN
                     ATKQLLVSSPPAVLILHLKRFQLGPRCIFRKLTRPVSYPNMLDIAAFCGSKVKNLPNI
                     DRKQKKLLYALYGVVEHSGGMYGGHYTAYVKVRPKVTPEDNRWKFLPHGSKAELDQDD
                     EQLKKLEELLAKEKASRLLHLNSMNDSDDFTNSSSNSSTSDEFNTNPNGGTGQDGHHE
                     QQEEEAANVQAPPGKWYYVSDSRVQEVSEDAALKAQAYLLFYERIY"
     misc_feature    391..582
                     /gene="LOC111074830"
                     /note="Zn-finger in ubiquitin-hydrolases and other
                     protein; Region: zf-UBP; pfam02148"
                     /db_xref="CDD:460464"
     misc_feature    973..>1590
                     /gene="LOC111074830"
                     /note="Peptidase C19 contains ubiquitinyl hydrolases. They
                     are intracellular peptidases that remove ubiquitin
                     molecules from polyubiquinated peptides by cleavage of
                     isopeptide bonds. They hydrolyse bonds involving the
                     carboxyl group of the C-terminal Gly...; Region:
                     Peptidase_C19; cl02553"
                     /db_xref="CDD:470612"
     misc_feature    <2779..3588
                     /gene="LOC111074830"
                     /note="A subfamily of Peptidase C19. Peptidase C19
                     contains ubiquitinyl hydrolases. They are intracellular
                     peptidases that remove ubiquitin molecules from
                     polyubiquinated peptides by cleavage of isopeptide bonds.
                     They hydrolyze bonds involving the carboxyl...; Region:
                     Peptidase_C19K; cd02667"
                     /db_xref="CDD:239132"
ORIGIN      
        1 agaaagtcaa cgacaaaggg aatggaagcg acagccaatg gaaacattag aaaaaagcgc
       61 gccaaaaagg gggctagagc gaagcagttg ctcgccatgg ggaagaagcg tcagatggac
      121 aaccacgaca atgccagttc aacggactcg ggccaggagg atagccacgg ccagacggcc
      181 ggtgccagcg gctcagcaag cgctgcagga gctggcagct tgggtgcgga tagccccatg
      241 accaactgct gccagcacat caagaaatcg gttgatgcgg cccggttgcg gcgtcaactg
      301 aaaaccaccg gcctggtata cgagtgctcg cagtgccaga agatcagcca gtccgctgca
      361 tccggttcag gctccggcgt agatctggcc tgcgacttcg agatcgacag cacgctctgg
      421 ctgtgcctca agtgcggcac ccagctctgc gggcggtcac gcaagcagca cgccctccag
      481 cactacaaga caccacactc ggactcgcat gcactggcca tgaacacacg atcatttgag
      541 atatggtgct atggctgcga caacaaggtc atccccaact cccgcaagaa cttgctcgag
      601 tgcgtcgagc tggtgaagcg tctggcccag aagccgcccg ccgatccacc tgtggaggcc
      661 actgtcgtgg ccgctcccag tccacccatc atcaccgaca tcgaactgaa attgaaatcg
      721 gccctaaatc ggctcaaacc cattgtgccc atgacgggtg gctcgttcga ggacaacaac
      781 agcaccggca gaagcggtgg gaaggccctg acaagtaacc taacagccat acccctgccg
      841 tcacccccag gagccaccgc cagcagccct gttccgggca tggccaagag gatcgactcc
      901 gccgccgtcg gcagcaatcc gaatcgcccg tgctcaccca ggagcgaact ggagcgacta
      961 ccgcgtgtcc gtggactgac caatttgggc aacacttgct tcttcaatgc tgttatgcag
     1021 tgcctcgccc agaccccgtt cctgctccgt gttctccggg agctggcgga accaggagaa
     1081 gaatttgagc tgcccggagg gacgttcgat ttcaaagaca agggccccac cgacttgccg
     1141 atcatccggg gcaccctctc ctcctggggc ggcctcacct cggcgctggc caacgcgctc
     1201 gaggagctgc aggtgggtgg tggcgtcttc acacccagca agctctttga caggctgtgc
     1261 gcgaagtgtc cgcagttcac gggcggggac cagcacgacg cccacgagct gctgcggcag
     1321 ctgttggaga gcgtgcgaaa cgaggatctc aagcgctatc agcgcgtcat cctgcagaac
     1381 ctcggctaca aggacgagga catacaaagc gtgtcggagg agatgcggca gaagtgcaag
     1441 atctatggca accaggccgg cgaccgcatc ctgcgaccag agcaggtctt ccgcggattt
     1501 ctcgtctcga cgctgacctg ccaggactgc cacagtgtct cgtcgcggca cgaatacttc
     1561 ctggacatgt ccctgccggt ggccgtcgag aagccccagc caccacagcg gcgcaggccc
     1621 agccccgaga gctcgccctt tcccatcgcc ggccagacac agacacaaac acagaaccag
     1681 tcgcagtcgc aatcccccac caagataaac accaagttca cgacgcccga ggatagcaac
     1741 ccgttctcga cggcttgttc ctcctcctcc tcgttctacc tgcacgcaaa cgagcaggag
     1801 cccgtcggtc cgtccaagtc gcaggtgaag aaggagaagg agcgcgagcg caaagcgaag
     1861 cgggcggcca agcaccatcg ctacaagcag gcacagaagc tcaccctcaa cctgaacgga
     1921 aacggaacgg gaagccaggc cgatgagtcg gatgccggca cagggagagt gacatcgtcc
     1981 gggggcggcg acggcgatgg ccagacgacc agcgatggcc aggatccgcc caaggaggat
     2041 ttaatgtcat cgagctccac cacatcggag aactcggacg ccgatgttga ggacaatttg
     2101 atggatgaaa cggcaagtgc cagggacagg actaagcccc gaggggccac cggcggctcc
     2161 tcatcctcac ccgctcaggg aggcagcaac agcagcagca gcagaagatt cttcaccgac
     2221 accaatggca atgcccagcc gctgggggag aagcgggacg acacgcccga gaacatggac
     2281 aaggactccc tcgaagagga tgagaacgac tctggcatag ccaccagtcc gttgcccagc
     2341 ggcatcagta aaacaacgac gaccaccacc gccaacaaca acgaggcttc cagaggtgca
     2401 gagcagcaac agccacagaa ggataagaag gaggagggcc aagcctctgc ggacatagtc
     2461 acagcgggcg tgagcgaggt gggtgcctcc accatacgcc aaatctcggt tgaattggat
     2521 ctgccaacga atggagacgt ccgagaggag gcgggtgagg cgaatgggga tgcggatgcg
     2581 aatgctacgc tccagctgca ggagatagcc caccagctgg ctataagtga attcaccttg
     2641 gaggccacag cggcaactgc agcttcggcc acagccgagg gggtggcagc agcagccgcg
     2701 gcggcaggag tcgcggcagc agcacgcgcc aagcgtgtgc gaacgtacag ctattcggac
     2761 tggagcacca cgatagcgcc gcggtaccag tgcgaggacg gagagtgctc cgtgcagtcc
     2821 tgcctcaaca acttcaccgc cgtcgaactg atgaccggcc agaacaaggt ggggtgcgag
     2881 agctgcaccc tgcggctgaa tggtaacgat acgaaggcca agtcggtcaa tacgaatgcc
     2941 accaagcagc tgctcgtgtc cagccctccg gcggtgctca ttctccacct gaaacgcttc
     3001 cagcttgggc cgcgctgcat attcaggaag ctaacgcggc cggtcagcta tccaaacatg
     3061 ctggacattg ccgccttctg cggatccaag gtgaagaatc tgcccaatat cgatcgcaag
     3121 cagaagaagc ttctgtacgc cctctacggg gtggtggagc actcgggcgg catgtatggc
     3181 ggccactata ccgcctacgt taaggtgcgg cccaaggtga cgccggagga caatcgctgg
     3241 aagttcctgc cgcacggcag caaggccgag ctcgatcagg atgacgagca gctgaagaag
     3301 ctggaggagc tgctggccaa ggagaaggcc tcgcgccttc tgcacttgaa ctcgatgaac
     3361 gacagcgacg acttcaccaa ctccagcagc aattcatcta cctcggacga gttcaatacc
     3421 aatcccaatg gcggtaccgg ccaggatggc catcacgagc agcaggagga ggaggctgcc
     3481 aatgtgcagg cgccgccagg gaaatggtac tacgtatccg attcgcgggt ccaggaggtt
     3541 agcgaggacg cggcgctcaa ggcccaggcc tatctgctct tctacgagcg catctactaa
     3601 gggggaggag actggaaatg ggactagaac tagcccaagg gacaacgaga actactacta
     3661 ggcactatgg acgggggaaa gcaacaagag aagagaaaag agaagaaaag aaaagagaga
     3721 gaaagaggag cagcagccat cgttccatta tatagcttac ga