PREDICTED: Drosophila obscura trypsin (LOC121403885), transcript


LOCUS       XM_041591965            1629 bp    mRNA    linear   INV 14-MAY-2021
DEFINITION  PREDICTED: Drosophila obscura trypsin (LOC121403885), transcript
            variant X3, mRNA.
ACCESSION   XM_041591965
VERSION     XM_041591965.1
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..1629
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..1629
                     /gene="LOC121403885"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 10 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 5 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:121403885"
     CDS             137..1108
                     /gene="LOC121403885"
                     /codon_start=1
                     /product="trypsin I-P1 isoform X3"
                     /protein_id="XP_041447899.1"
                     /db_xref="GeneID:121403885"
                     /translation="MDTPWQLQVLLQMLLSWTLAANGHRKFVMLPKVVGGYSITIEQV
                     PFQLSVRRRTMHERAYGLGLICGGALISQRVACSAAHCYAVNNTHNPVRYHDPTMFVV
                     VAGSTQIDQADRHTKEYLVQQIIAHSAYNASSLENDIALLFLNGYVSWQSRAVRAIPL
                     ATKAQTEGTTCLINGWAANLFPKVGKSASLQQAPVPILNKSLCRAIYMLPVSQLCAGF
                     MQGGIDACQGDSGGPLICDGQLAGIISWGVGCADPGFPGVYTNVSHFVDWIQMVNATL
                     DYSKYTVVGSADLASGAQRTWWLALAFLLIALGGSWSGGWNLNWNWG"
     misc_feature    233..952
                     /gene="LOC121403885"
                     /note="Trypsin-like serine protease; Many of these are
                     synthesized as inactive precursor zymogens that are
                     cleaved during limited proteolysis to generate their
                     active forms. Alignment contains also inactive enzymes
                     that have substitutions of the catalytic triad...; Region:
                     Tryp_SPc; cd00190"
                     /db_xref="CDD:238113"
     misc_feature    233..235
                     /gene="LOC121403885"
                     /note="cleavage site [active]"
                     /db_xref="CDD:238113"
     misc_feature    order(377..379,548..550,824..826)
                     /gene="LOC121403885"
                     /note="active site"
                     /db_xref="CDD:238113"
     misc_feature    order(806..808,869..871,875..877)
                     /gene="LOC121403885"
                     /note="substrate binding sites [chemical binding]; other
                     site"
                     /db_xref="CDD:238113"
ORIGIN      
        1 gaacatcgat acatccatca gctacccggc agcttgaaag gcaaaacttt gtttacgttt
       61 tgttattgag ctttagttga gctaaacaaa caaaacaaaa acagggtgcc gtgaagattt
      121 gtatggaatt attacgatgg acacaccgtg gcagctgcag gtgctcttgc agatgcttct
      181 atcgtggaca ttggcggcca acgggcatcg caagttcgtg atgctgccga aggtggtggg
      241 cggctattcg ataacgatcg aacaggtccc gttccagctg tcggtgcgtc gccggacgat
      301 gcacgaaagg gcatacggat tgggcctcat ctgtggcggg gcattgatct cgcagcgtgt
      361 ggcctgctcg gcggcccact gctatgccgt aaacaacaca cacaacccgg tgaggtatca
      421 cgatccgacc atgttcgtgg tggtggcggg cagcacacaa atcgaccagg ccgacaggca
      481 caccaaggag tatctggtgc agcaaatcat cgcccacagc gcctacaatg cctcctcgct
      541 ggagaacgac atcgcgctgc tcttcctcaa cggctacgtg tcgtggcagt cgagggccgt
      601 gcgagccatt ccgctggcca ccaaggccca gactgagggc accacgtgcc tgatcaatgg
      661 ctgggctgcg aatctcttcc cgaaggtggg caaatcggca tcgctgcagc aggcgccggt
      721 gcccatcctg aacaagagcc tctgccgtgc catctacatg ctgccagtgt cccagctgtg
      781 cgctggcttc atgcagggcg gcatcgatgc ctgtcagggt gactctggcg gtcccctaat
      841 ctgcgacggc cagctggcgg gcatcatctc gtggggcgtg ggctgtgcgg atcccggctt
      901 tcccggcgtc tataccaatg tctcgcactt tgttgattgg atccaaatgg taaacgccac
      961 gctcgactac tccaaataca cggtggtggg ctcggcggat ctggccagcg gtgcccaacg
     1021 tacctggtgg ctggccttgg catttctgct tatcgctctg ggcgggagct ggagcggggg
     1081 ctggaacttg aactggaact ggggctgatg atgtgcgggc caagatatgg aatgttggac
     1141 agcaataata aaatcatcat tcagcttgtc tcttctgtca tttaataatc taatcatctc
     1201 cgcatacgca cttgtgtatc gattgcccaa ccatagatac agaaatcgaa ttgccgtatg
     1261 actaaaaggg tgacacaata accaatttta atcagccaca aggactggga cagggagtgg
     1321 gactgggact gggagtgttg cgcctgcccc tcaagatcaa agaccgagaa aacccaacga
     1381 cctacaccta cctccaagac ccaacaaata tcgttttaac tgctcgattc tgtgggttcc
     1441 aatagataat atttattaac ggataagagc gcattcaata tatctgattg ttatctgatg
     1501 atatgccaaa tcaaatcata attggatcat aaatatgtac agacaatacg agaatgaacc
     1561 gaaaagtaca aacctccttt tggatttttg attgttgcaa ttgccgagcc tcgaacctct
     1621 tcaaaatat