PREDICTED: Drosophila obscura arginine/serine-rich protein 1


LOCUS       XM_022364249            2433 bp    mRNA    linear   INV 14-MAY-2021
DEFINITION  PREDICTED: Drosophila obscura arginine/serine-rich protein 1
            (LOC111072401), transcript variant X1, mRNA.
ACCESSION   XM_022364249
VERSION     XM_022364249.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022364249.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..2433
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..2433
                     /gene="LOC111072401"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 4 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 14 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111072401"
     CDS             514..1596
                     /gene="LOC111072401"
                     /codon_start=1
                     /product="arginine/serine-rich protein 1"
                     /protein_id="XP_022219941.1"
                     /db_xref="GeneID:111072401"
                     /translation="MSAARLPYYQQDHSPDKQRRGGRGQRGYSDRNASGSHRRDRSRS
                     VERRRYSRSRSRSRSRSRSAERSGQRRRRDERNDERRQQQPTRYHRERDSRERSRERD
                     RDRDYSRRSGHYRRSDSPASVGGGGVSSSSSQRRHRQSSGGGSEPNAAHNSHNEAQPA
                     NRSNAMSAVGAYYNLDTEEPFDKERIHREMEEKLREALAREGKVYPPRKPEPPSHPVF
                     ANDGSFMELFKKMQQEKRQQLQLGQDYQLESSALASGSTDLQSPIEAHPGIPCLPAIA
                     VGAANSATAPYIAAAAAGKSAPPPPMVGRRRGGKVLKTGMVAKLKTQNEQEVDPKDFW
                     SLYLAEVNKYKSNACDTDNGKRPLVK"
ORIGIN      
        1 cagaaacgca atactaattg catttgcaag caaattgtaa gcctcggtat tgattccaat
       61 cgcattaaaa gcaaaaccca aaatacccac gagaaatctt gtggcgaacc gacacacata
      121 cacacacaca cgcacttacg cattgacatc tctccgctgt tgaggctttg gcagcaggaa
      181 aaaaagtgca aagcaaatta cataactcgt ttatttgtat atacatcaat tagtttgagg
      241 taaaaaattc tacatcatct gcataagccg aatatccgat acgatttcag agtcctcaca
      301 atccaagagt cagagtaaaa caagcacaaa tacacacaag caagcaggca agccatcaaa
      361 cgggccagcc cagaactacg gataatacag cctggataat acagtacgca gcccacagga
      421 gcgaacgcgg agaaacatca tctgatcttg gccgacaatc atctctccta gtggacgcaa
      481 cgcaaacaat ttcgaattgc agatcaaccc gacatgtcgg cggctcgctt gccctactat
      541 cagcaggatc attcgccgga caagcagcgg cgcggtggac gcggccagcg tggctattcc
      601 gaccgcaacg cctctggctc tcatagacgg gaccgtagcc gctccgtaga acgccgccgc
      661 tacagtcgca gccgctcacg ctctcgatcc cgcagtcgtt ccgcagagcg ttcgggccaa
      721 cggcggcgac gtgacgaacg gaacgacgag cgacgtcaac agcagccgac gcgctaccac
      781 cgcgaaaggg attccaggga gcgttcacgg gagcgggatc gcgaccgtga ctactccaga
      841 cgctctggcc attatcgtcg ttcagactcg cctgcatccg tcggcggagg cggagtaagt
      901 tccagttcca gtcagcggcg ccatcgccaa tcatctggag gcggatcgga accgaatgcc
      961 gcacataatt cacacaatga ggcccagcca gctaacagat ccaatgccat gtccgcggtg
     1021 ggagcctatt acaacctaga cacggaggag ccattcgaca aggagcgcat tcatcgtgaa
     1081 atggaggaga aactgcgcga agccctggcc agagagggca aagtttatcc gccacgtaag
     1141 cctgagccgc cgtcgcatcc tgtctttgcc aatgatggct cgttcatgga gctgtttaag
     1201 aaaatgcagc aggagaagag gcagcagctg cagctcggcc aggactatca gttggagagc
     1261 agtgcactcg catctggcag tacggacctg cagtcaccga tagaggctca tccgggcata
     1321 ccctgcctgc ccgccattgc agtgggagct gcaaacagtg cgacagcacc ctacattgcc
     1381 gctgcggcag ccggaaaatc agctccaccg ccccccatgg tgggaaggcg gcgcggcggt
     1441 aaggtcctga agaccggcat ggtggccaaa ttgaagacac aaaatgaaca ggaagtggac
     1501 ccaaaggact tctggtcact atatttagcc gaggtcaata agtacaagag caatgcctgc
     1561 gacacggaca atggcaagcg tccgttggtc aagtagggca tggaaaaatg aaattgaacg
     1621 cagaagacac tccctatgga gacgctccct tcaggagcga tccttccgtt tggtttgctt
     1681 tattccccgc accacaccac acaatccgat cagggcattc acgcgccttc aagctcacat
     1741 taaaattact tatgtacatt atgcaaatga tggtagatcc gcgacagaaa tgtagtttgt
     1801 gaaatgtaaa ttacgacaaa tcgatggatt cttttttttt ttttatagat atatactatt
     1861 tacggatata tatatatata tagtaaatat gtatgtaact tttgtacacg ttaagggacg
     1921 aagccgtagc cgctgcctca atataagaat attaatgatt aaacatagaa tagctcataa
     1981 ggccgtagca tagtggatat atacgaactg tatgtgtgtc cctttctata ttatatacat
     2041 acatacatct acatatacat atgtaagaag catattatta gtgcatagaa aagcgcacat
     2101 tcagcatcga caaaaacatg aggaactaac caatatgatt ctttataatc tatctctttc
     2161 tctcctctcc gtctccgttc atgcaccaaa actcaactca actcgaaacc ctattcctta
     2221 tttcattaca ttttattttt cttataaata acttcacgtt ccttccaatc ttaaccgact
     2281 atcaaaccgc ctatctgtct tgtctatatc attctctctc ccctctctct ctctctctgt
     2341 atacctatgt accttggttt acaatttgct tggtttcctt tcatttctgt ggtttttccc
     2401 cctttttttt tttttttttt tttgttttct taa