PREDICTED: Drosophila obscura arginine/serine-rich protein 1


LOCUS       XM_022364250            2421 bp    mRNA    linear   INV 14-MAY-2021
DEFINITION  PREDICTED: Drosophila obscura arginine/serine-rich protein 1
            (LOC111072401), transcript variant X2, mRNA.
ACCESSION   XM_022364250
VERSION     XM_022364250.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022364250.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..2421
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..2421
                     /gene="LOC111072401"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 4 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 14 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111072401"
     CDS             502..1584
                     /gene="LOC111072401"
                     /codon_start=1
                     /product="arginine/serine-rich protein 1"
                     /protein_id="XP_022219942.1"
                     /db_xref="GeneID:111072401"
                     /translation="MSAARLPYYQQDHSPDKQRRGGRGQRGYSDRNASGSHRRDRSRS
                     VERRRYSRSRSRSRSRSRSAERSGQRRRRDERNDERRQQQPTRYHRERDSRERSRERD
                     RDRDYSRRSGHYRRSDSPASVGGGGVSSSSSQRRHRQSSGGGSEPNAAHNSHNEAQPA
                     NRSNAMSAVGAYYNLDTEEPFDKERIHREMEEKLREALAREGKVYPPRKPEPPSHPVF
                     ANDGSFMELFKKMQQEKRQQLQLGQDYQLESSALASGSTDLQSPIEAHPGIPCLPAIA
                     VGAANSATAPYIAAAAAGKSAPPPPMVGRRRGGKVLKTGMVAKLKTQNEQEVDPKDFW
                     SLYLAEVNKYKSNACDTDNGKRPLVK"
ORIGIN      
        1 ccagaaacgc aatactaatt gcatttgcaa gcaaattgta agcctcggta ttgattccaa
       61 tcgcattaaa agcaaaaccc aaaataccca cgagaaatct tgtggcgaac cgacacacat
      121 acacacacac acgcacttac gcattgacat ctctccgctg ttgaggcttt ggcagcagga
      181 aaaaaagtgc aaagcaaatt acataactcg tttatttgta tatacatcaa ttagtttgag
      241 gtaaaaaatt ctacatcatc tgcataagcc gaatatccga tacgatttca gagtcctcac
      301 aatccaagag tcagagtaaa acaagcacaa atacacacaa gcaagcaggc aagccatcaa
      361 acgggccagc ccagaactac ggataataca gcctggataa tacagtacgc agcccacagg
      421 agcgaacgcg gagaaacatc atctgatctt ggccgacaat catctctcct agtggacgca
      481 acgcaaacaa atcaacccga catgtcggcg gctcgcttgc cctactatca gcaggatcat
      541 tcgccggaca agcagcggcg cggtggacgc ggccagcgtg gctattccga ccgcaacgcc
      601 tctggctctc atagacggga ccgtagccgc tccgtagaac gccgccgcta cagtcgcagc
      661 cgctcacgct ctcgatcccg cagtcgttcc gcagagcgtt cgggccaacg gcggcgacgt
      721 gacgaacgga acgacgagcg acgtcaacag cagccgacgc gctaccaccg cgaaagggat
      781 tccagggagc gttcacggga gcgggatcgc gaccgtgact actccagacg ctctggccat
      841 tatcgtcgtt cagactcgcc tgcatccgtc ggcggaggcg gagtaagttc cagttccagt
      901 cagcggcgcc atcgccaatc atctggaggc ggatcggaac cgaatgccgc acataattca
      961 cacaatgagg cccagccagc taacagatcc aatgccatgt ccgcggtggg agcctattac
     1021 aacctagaca cggaggagcc attcgacaag gagcgcattc atcgtgaaat ggaggagaaa
     1081 ctgcgcgaag ccctggccag agagggcaaa gtttatccgc cacgtaagcc tgagccgccg
     1141 tcgcatcctg tctttgccaa tgatggctcg ttcatggagc tgtttaagaa aatgcagcag
     1201 gagaagaggc agcagctgca gctcggccag gactatcagt tggagagcag tgcactcgca
     1261 tctggcagta cggacctgca gtcaccgata gaggctcatc cgggcatacc ctgcctgccc
     1321 gccattgcag tgggagctgc aaacagtgcg acagcaccct acattgccgc tgcggcagcc
     1381 ggaaaatcag ctccaccgcc ccccatggtg ggaaggcggc gcggcggtaa ggtcctgaag
     1441 accggcatgg tggccaaatt gaagacacaa aatgaacagg aagtggaccc aaaggacttc
     1501 tggtcactat atttagccga ggtcaataag tacaagagca atgcctgcga cacggacaat
     1561 ggcaagcgtc cgttggtcaa gtagggcatg gaaaaatgaa attgaacgca gaagacactc
     1621 cctatggaga cgctcccttc aggagcgatc cttccgtttg gtttgcttta ttccccgcac
     1681 cacaccacac aatccgatca gggcattcac gcgccttcaa gctcacatta aaattactta
     1741 tgtacattat gcaaatgatg gtagatccgc gacagaaatg tagtttgtga aatgtaaatt
     1801 acgacaaatc gatggattct tttttttttt ttatagatat atactattta cggatatata
     1861 tatatatata gtaaatatgt atgtaacttt tgtacacgtt aagggacgaa gccgtagccg
     1921 ctgcctcaat ataagaatat taatgattaa acatagaata gctcataagg ccgtagcata
     1981 gtggatatat acgaactgta tgtgtgtccc tttctatatt atatacatac atacatctac
     2041 atatacatat gtaagaagca tattattagt gcatagaaaa gcgcacattc agcatcgaca
     2101 aaaacatgag gaactaacca atatgattct ttataatcta tctctttctc tcctctccgt
     2161 ctccgttcat gcaccaaaac tcaactcaac tcgaaaccct attccttatt tcattacatt
     2221 ttatttttct tataaataac ttcacgttcc ttccaatctt aaccgactat caaaccgcct
     2281 atctgtcttg tctatatcat tctctctccc ctctctctct ctctctgtat acctatgtac
     2341 cttggtttac aatttgcttg gtttcctttc atttctgtgg tttttccccc tttttttttt
     2401 tttttttttt tgttttctta a