PREDICTED: Drosophila obscura trypsin (LOC121403885), transcript


LOCUS       XM_041591963            1710 bp    mRNA    linear   INV 14-MAY-2021
            variant X1, mRNA.
ACCESSION   XM_041591963
VERSION     XM_041591963.1
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..1710
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..1710
                     /gene="LOC121403885"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 10 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 5 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:121403885"
     CDS             137..1189
                     /gene="LOC121403885"
                     /codon_start=1
                     /product="trypsin I-P1 isoform X1"
                     /protein_id="XP_041447897.1"
                     /db_xref="GeneID:121403885"
                     /translation="MDTPWQLQVLLQMLLSWTLAANGHRELFPSLRQGTTASSSATTT
                     LNVLSDAGKFVMLPKVVGGYSITIEQVPFQLSVRRRTMHERAYGLGLICGGALISQRV
                     ACSAAHCYAVNNTHNPVRYHDPTMFVVVAGSTQIDQADRHTKEYLVQQIIAHSAYNAS
                     SLENDIALLFLNGYVSWQSRAVRAIPLATKAQTEGTTCLINGWAANLFPKVGKSASLQ
                     QAPVPILNKSLCRAIYMLPVSQLCAGFMQGGIDACQGDSGGPLICDGQLAGIISWGVG
                     CADPGFPGVYTNVSHFVDWIQMVNATLDYSKYTVVGSADLASGAQRTWWLALAFLLIA
                     LGGSWSGGWNLNWNWG"
     misc_feature    314..1033
                     /gene="LOC121403885"
                     /note="Trypsin-like serine protease; Many of these are
                     synthesized as inactive precursor zymogens that are
                     cleaved during limited proteolysis to generate their
                     active forms. Alignment contains also inactive enzymes
                     that have substitutions of the catalytic triad...; Region:
                     Tryp_SPc; cd00190"
                     /db_xref="CDD:238113"
     misc_feature    314..316
                     /gene="LOC121403885"
                     /note="cleavage site [active]"
                     /db_xref="CDD:238113"
     misc_feature    order(458..460,629..631,905..907)
                     /gene="LOC121403885"
                     /note="active site"
                     /db_xref="CDD:238113"
     misc_feature    order(887..889,950..952,956..958)
                     /gene="LOC121403885"
                     /note="substrate binding sites [chemical binding]; other
                     site"
                     /db_xref="CDD:238113"
ORIGIN      
        1 gaacatcgat acatccatca gctacccggc agcttgaaag gcaaaacttt gtttacgttt
       61 tgttattgag ctttagttga gctaaacaaa caaaacaaaa acagggtgcc gtgaagattt
      121 gtatggaatt attacgatgg acacaccgtg gcagctgcag gtgctcttgc agatgcttct
      181 atcgtggaca ttggcggcca acgggcatcg tgagttgttt ccctctctcc gccagggcac
      241 aacagcctcc tcctccgcca caacaactct aaacgtgctc tccgatgcag gcaagttcgt
      301 gatgctgccg aaggtggtgg gcggctattc gataacgatc gaacaggtcc cgttccagct
      361 gtcggtgcgt cgccggacga tgcacgaaag ggcatacgga ttgggcctca tctgtggcgg
      421 ggcattgatc tcgcagcgtg tggcctgctc ggcggcccac tgctatgccg taaacaacac
      481 acacaacccg gtgaggtatc acgatccgac catgttcgtg gtggtggcgg gcagcacaca
      541 aatcgaccag gccgacaggc acaccaagga gtatctggtg cagcaaatca tcgcccacag
      601 cgcctacaat gcctcctcgc tggagaacga catcgcgctg ctcttcctca acggctacgt
      661 gtcgtggcag tcgagggccg tgcgagccat tccgctggcc accaaggccc agactgaggg
      721 caccacgtgc ctgatcaatg gctgggctgc gaatctcttc ccgaaggtgg gcaaatcggc
      781 atcgctgcag caggcgccgg tgcccatcct gaacaagagc ctctgccgtg ccatctacat
      841 gctgccagtg tcccagctgt gcgctggctt catgcagggc ggcatcgatg cctgtcaggg
      901 tgactctggc ggtcccctaa tctgcgacgg ccagctggcg ggcatcatct cgtggggcgt
      961 gggctgtgcg gatcccggct ttcccggcgt ctataccaat gtctcgcact ttgttgattg
     1021 gatccaaatg gtaaacgcca cgctcgacta ctccaaatac acggtggtgg gctcggcgga
     1081 tctggccagc ggtgcccaac gtacctggtg gctggccttg gcatttctgc ttatcgctct
     1141 gggcgggagc tggagcgggg gctggaactt gaactggaac tggggctgat gatgtgcggg
     1201 ccaagatatg gaatgttgga cagcaataat aaaatcatca ttcagcttgt ctcttctgtc
     1261 atttaataat ctaatcatct ccgcatacgc acttgtgtat cgattgccca accatagata
     1321 cagaaatcga attgccgtat gactaaaagg gtgacacaat aaccaatttt aatcagccac
     1381 aaggactggg acagggagtg ggactgggac tgggagtgtt gcgcctgccc ctcaagatca
     1441 aagaccgaga aaacccaacg acctacacct acctccaaga cccaacaaat atcgttttaa
     1501 ctgctcgatt ctgtgggttc caatagataa tatttattaa cggataagag cgcattcaat
     1561 atatctgatt gttatctgat gatatgccaa atcaaatcat aattggatca taaatatgta
     1621 cagacaatac gagaatgaac cgaaaagtac aaacctcctt ttggattttt gattgttgca
     1681 attgccgagc ctcgaacctc ttcaaaatat