PREDICTED: Drosophila obscura arginine/serine-rich protein 1


LOCUS       XM_022364251            2797 bp    mRNA    linear   INV 14-MAY-2021
            (LOC111072401), transcript variant X3, mRNA.
ACCESSION   XM_022364251
VERSION     XM_022364251.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022364251.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..2797
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..2797
                     /gene="LOC111072401"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 4 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 4 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111072401"
     CDS             878..1960
                     /gene="LOC111072401"
                     /codon_start=1
                     /product="arginine/serine-rich protein 1"
                     /protein_id="XP_022219943.1"
                     /db_xref="GeneID:111072401"
                     /translation="MSAARLPYYQQDHSPDKQRRGGRGQRGYSDRNASGSHRRDRSRS
                     VERRRYSRSRSRSRSRSRSAERSGQRRRRDERNDERRQQQPTRYHRERDSRERSRERD
                     RDRDYSRRSGHYRRSDSPASVGGGGVSSSSSQRRHRQSSGGGSEPNAAHNSHNEAQPA
                     NRSNAMSAVGAYYNLDTEEPFDKERIHREMEEKLREALAREGKVYPPRKPEPPSHPVF
                     ANDGSFMELFKKMQQEKRQQLQLGQDYQLESSALASGSTDLQSPIEAHPGIPCLPAIA
                     VGAANSATAPYIAAAAAGKSAPPPPMVGRRRGGKVLKTGMVAKLKTQNEQEVDPKDFW
                     SLYLAEVNKYKSNACDTDNGKRPLVK"
ORIGIN      
        1 ccagaaacgc aatactaatt gcatttgcaa gcaaattgta agcctcggta ttgattccaa
       61 tcgcattaaa agcaaaaccc aaaataccca cgagaaatct tgtggcgaac cgacacacat
      121 acacacacac acgcacttac gcattgacat ctctccgctg ttgaggcttt ggcagcagga
      181 aaaaaagtgc aaagcaaatt acataactcg tttatttgta tatacatcaa ttagtttgag
      241 gtaaaaaatt ctacatcatc tgcataagcc gaatatccga tacgatttca gagtcctcac
      301 aatccaagag tcagagtaaa acaagcacaa atacacacaa gcaagcaggc aagccatcaa
      361 acgggccagc ccagaactac ggataataca gcctggataa tacagtacgc agcccacagg
      421 agcgaacgcg gagaaacatc atctgatctt ggccgacaat catctctcct agtggacgca
      481 acgcaaacaa gtaaatttta ccatatctca ttttaatcaa gtcaatcaag aatcgaaaaa
      541 taacaagaac aagaaatcaa caatcaagga ctcactctcg agtctactaa atccaagtac
      601 aagtatccaa attgcataag aatccccatg tgcgggtata tcttgtgagg tggtgctcag
      661 ttcttattca gtatattctc gttgcctcat ctggctgggt gctggctgct aagctgctgg
      721 ctgctcgctg cagctccagc caggtcggag gaaaccagaa actgcttgac gacccacaag
      781 gaacgattag ctcgattttg aaccgcagaa cttacagata tacagaaaaa aaaacagata
      841 cagatacaga tattgtgtat gcatagatca acccgacatg tcggcggctc gcttgcccta
      901 ctatcagcag gatcattcgc cggacaagca gcggcgcggt ggacgcggcc agcgtggcta
      961 ttccgaccgc aacgcctctg gctctcatag acgggaccgt agccgctccg tagaacgccg
     1021 ccgctacagt cgcagccgct cacgctctcg atcccgcagt cgttccgcag agcgttcggg
     1081 ccaacggcgg cgacgtgacg aacggaacga cgagcgacgt caacagcagc cgacgcgcta
     1141 ccaccgcgaa agggattcca gggagcgttc acgggagcgg gatcgcgacc gtgactactc
     1201 cagacgctct ggccattatc gtcgttcaga ctcgcctgca tccgtcggcg gaggcggagt
     1261 aagttccagt tccagtcagc ggcgccatcg ccaatcatct ggaggcggat cggaaccgaa
     1321 tgccgcacat aattcacaca atgaggccca gccagctaac agatccaatg ccatgtccgc
     1381 ggtgggagcc tattacaacc tagacacgga ggagccattc gacaaggagc gcattcatcg
     1441 tgaaatggag gagaaactgc gcgaagccct ggccagagag ggcaaagttt atccgccacg
     1501 taagcctgag ccgccgtcgc atcctgtctt tgccaatgat ggctcgttca tggagctgtt
     1561 taagaaaatg cagcaggaga agaggcagca gctgcagctc ggccaggact atcagttgga
     1621 gagcagtgca ctcgcatctg gcagtacgga cctgcagtca ccgatagagg ctcatccggg
     1681 cataccctgc ctgcccgcca ttgcagtggg agctgcaaac agtgcgacag caccctacat
     1741 tgccgctgcg gcagccggaa aatcagctcc accgcccccc atggtgggaa ggcggcgcgg
     1801 cggtaaggtc ctgaagaccg gcatggtggc caaattgaag acacaaaatg aacaggaagt
     1861 ggacccaaag gacttctggt cactatattt agccgaggtc aataagtaca agagcaatgc
     1921 ctgcgacacg gacaatggca agcgtccgtt ggtcaagtag ggcatggaaa aatgaaattg
     1981 aacgcagaag acactcccta tggagacgct cccttcagga gcgatccttc cgtttggttt
     2041 gctttattcc ccgcaccaca ccacacaatc cgatcagggc attcacgcgc cttcaagctc
     2101 acattaaaat tacttatgta cattatgcaa atgatggtag atccgcgaca gaaatgtagt
     2161 ttgtgaaatg taaattacga caaatcgatg gattcttttt ttttttttat agatatatac
     2221 tatttacgga tatatatata tatatagtaa atatgtatgt aacttttgta cacgttaagg
     2281 gacgaagccg tagccgctgc ctcaatataa gaatattaat gattaaacat agaatagctc
     2341 ataaggccgt agcatagtgg atatatacga actgtatgtg tgtccctttc tatattatat
     2401 acatacatac atctacatat acatatgtaa gaagcatatt attagtgcat agaaaagcgc
     2461 acattcagca tcgacaaaaa catgaggaac taaccaatat gattctttat aatctatctc
     2521 tttctctcct ctccgtctcc gttcatgcac caaaactcaa ctcaactcga aaccctattc
     2581 cttatttcat tacattttat ttttcttata aataacttca cgttccttcc aatcttaacc
     2641 gactatcaaa ccgcctatct gtcttgtcta tatcattctc tctcccctct ctctctctct
     2701 ctgtatacct atgtaccttg gtttacaatt tgcttggttt cctttcattt ctgtggtttt
     2761 tccccctttt tttttttttt tttttttgtt ttcttaa