PREDICTED: Drosophila obscura trypsin (LOC121403885), transcript


LOCUS       XM_041591967             857 bp    mRNA    linear   INV 14-MAY-2021
            variant X5, mRNA.
ACCESSION   XM_041591967
VERSION     XM_041591967.1
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..857
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..857
                     /gene="LOC121403885"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 1 Protein, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 6 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:121403885"
     CDS             140..724
                     /gene="LOC121403885"
                     /codon_start=1
                     /product="uncharacterized protein LOC121403885 isoform X5"
                     /protein_id="XP_041447901.1"
                     /db_xref="GeneID:121403885"
                     /translation="MDTPWQLQVLLQMLLSWTLAANGHRELFPSLRQGTTASSSATTT
                     LNVLSDAGKFVMLPKVVGGYSITIEQVPFQLSVRRRTMHERAYGLGLICGGALISQRV
                     ACSAAHCYAVWKQHTQPGEVSRSDHVRGGGGQHTNRPGRQAHQGVSGAANHRPQRLQC
                     LLAGERHRAALPQRLRVVAVEGRASHSAGHQGPD"
     misc_feature    314..>544
                     /gene="LOC121403885"
                     /note="Trypsin-like serine protease; Many of these are
                     synthesized as inactive precursor zymogens that are
                     cleaved during limited proteolysis to generate their
                     active forms. Alignment contains also inactive enzymes
                     that have substitutions of the catalytic triad...; Region:
                     Tryp_SPc; cl21584"
                     /db_xref="CDD:473915"
     misc_feature    317..319
                     /gene="LOC121403885"
                     /note="cleavage site [active]"
                     /db_xref="CDD:238113"
ORIGIN      
        1 tacgaacatc gatacatcca tcagctaccc ggcagcttga aaggcaaaac tttgtttacg
       61 ttttgttatt gagctttagt tgagctaaac aaacaaaaca aaaacagggt gccgtgaaga
      121 tttgtatgga attattacga tggacacacc gtggcagctg caggtgctct tgcagatgct
      181 tctatcgtgg acattggcgg ccaacgggca tcgtgagttg tttccctctc tccgccaggg
      241 cacaacagcc tcctcctccg ccacaacaac tctaaacgtg ctctccgatg caggcaagtt
      301 cgtgatgctg ccgaaggtgg tgggcggcta ttcgataacg atcgaacagg tcccgttcca
      361 gctgtcggtg cgtcgccgga cgatgcacga aagggcatac ggattgggcc tcatctgtgg
      421 cggggcattg atctcgcagc gtgtggcctg ctcggcggcc cactgctatg ccgtgtggaa
      481 acaacacaca caacccggtg aggtatcacg atccgaccat gttcgtggtg gtggcgggca
      541 gcacacaaat cgaccaggcc gacaggcaca ccaaggagta tctggtgcag caaatcatcg
      601 cccacagcgc ctacaatgcc tcctcgctgg agaacgacat cgcgctgctc ttcctcaacg
      661 gctacgtgtc gtggcagtcg agggccgtgc gagccattcc gctggccacc aaggcccaga
      721 ctgagggcac cacgtgcctg atcaatggct ggggtaagat cacaatggtg ggcaaatcgg
      781 catcgctgca gcaggcgccg gtgcccatcc tgaacaagag cctctgccgt gccatctaca
      841 tgctgccagt gtcccag