PREDICTED: Drosophila obscura serine/arginine repetitive matrix


LOCUS       XM_041591971            2224 bp    mRNA    linear   INV 14-MAY-2021
            protein 1-like (LOC121403886), mRNA.
ACCESSION   XM_041591971
VERSION     XM_041591971.1
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq; corrected model; includes ab initio.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
            
            ##RefSeq-Attributes-START##
            ab initio   :: 1% of CDS bases
            frameshifts :: corrected 1 indel
            ##RefSeq-Attributes-END##
PRIMARY     REFSEQ_SPAN         PRIMARY_IDENTIFIER PRIMARY_SPAN        COMP
            1-184               JAECWW010000165.1  81495-81678         c
            185-282             JAECWW010000165.1  63083-63180         c
            283-388             JAECWW010000165.1  35737-35842         c
            389-934             JAECWW010000165.1  35121-35666         c
            935-1648            JAECWW010000165.1  33919-34632         c
            1649-1836           JAECWW010000165.1  33730-33917         c
            1837-1940           JAECWW010000165.1  33561-33664         c
            1941-2050           JAECWW010000165.1  19282-19391         c
            2051-2224           JAECWW010000165.1  18785-18958         c
FEATURES             Location/Qualifiers
     source          1..2224
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..2224
                     /gene="LOC121403886"
                     /note="The sequence of the model RefSeq transcript was
                     modified relative to its source genomic sequence to
                     represent the inferred CDS: deleted 1 base in 1 codon;
                     Derived by automated computational analysis using gene
                     prediction method: Gnomon. Supporting evidence includes
                     similarity to: 3 Proteins, and 99% coverage of the
                     annotated genomic feature by RNAseq alignments, including
                     3 samples with support for all annotated introns"
                     /db_xref="GeneID:121403886"
     CDS             221..2224
                     /gene="LOC121403886"
                     /note="The sequence of the model RefSeq protein was
                     modified relative to its source genomic sequence to
                     represent the inferred CDS: deleted 1 base in 1 codon"
                     /codon_start=1
                     /product="LOW QUALITY PROTEIN: serine/arginine repetitive
                     matrix protein 1-like"
                     /protein_id="XP_041447905.1"
                     /db_xref="GeneID:121403886"
                     /translation="MMAERTINWAMDAEMGMIKLKTMTAVCFVCNLPIMSHQVGLVWS
                     GGNGWDDLVREQLEESTIRQRLGGRRDSAAQITTPPSTSPPPGLQRRRRSSLAQLTDI
                     LREWSGGTKQQTQQQQQQQAQQQARNKGQLNRRETLADLARSLPWRTSTTDASTGAGG
                     AGAGTGSSTSGGNITYIAPRKRRESSADSGIRSIRSRRESNTAEFVKHWNRRESTAVE
                     EQAPSHISVNVVVVETTTKSASRRGSGESYLSSSRRDSNVAGRVTTPPPPPKYQVTKK
                     RDSLAAPEFPNFRQEQRPSTSSAGSCHSDSVSVPLIQYHQQVDSACQALPPPTIITSS
                     VTPPATSPTAPKGRRDSTTQCGRVNRRDSKAGHSPERAPRMNRLQRQATAFDESVLPG
                     GSRRGSQPALSPDPPEDCERRASRRDSLSPDSASRGGRRDSRTHLSPDRTHERDGSPR
                     RHTLRRQSSSAARHSPESNSCGSSRDPSPCSRPPPLPAVEQNQRPAIRRQSTTEEILI
                     ARGFRRQSTTEEMIRCRNFRRQSSQSDDVCRYRGRRDSSAQIIDGTIGTMTVETTSTF
                     FDSSTQTEPSPLYDNNHYHEECLRCNSCGLNLTGPNQRRARRFKNQILCDLHFADVAL
                     MECSDFMQQLRSFKPQSLGCAVARRKSSTTLIFPLPPQACSGM"
     misc_feature    1013..>1777
                     /gene="LOC121403886"
                     /note="transcriptional regulator ICP4; Provisional;
                     Region: PHA03307"
                     /db_xref="CDD:223039"
     misc_feature    <1937..2074
                     /gene="LOC121403886"
                     /note="Zinc-binding domain present in Lin-11, Isl-1,
                     Mec-3; Region: LIM; smart00132"
                     /db_xref="CDD:214528"
ORIGIN      
        1 ttgaatcctc ttcaaatata catacaaaca aaaaaatata tcagacacta agaaaatcta
       61 agaatatata agacatatca actaaagata tcgagccgat attccactga agaaatcggc
      121 atgcaaagta ctaacataaa acgaaactaa cgagagagtc cacgattcca aggaagcaaa
      181 aaattttttt gttgtctaac atccaaggtc cgatgctcac atgatggccg aaagaacgat
      241 caattgggcc atggatgccg agatgggcat gattaagctc aagacaatga cagcggtatg
      301 ctttgtgtgc aacctgccca tcatgtcaca tcaggtgggt ctggtgtggt caggtggcaa
      361 cggctgggac gacctcgtcc gcgaacagct ggaagagtca acgatccgtc agcgattagg
      421 cggacgtcgc gattccgccg cccagatcac aaccccaccg agcacgtcgc caccgccagg
      481 acttcaacgg cggcggcgca gctccttggc ccaacttact gacattctgc gcgagtggag
      541 cggcggcacc aagcaacaga cccaacagca gcagcagcaa caggcccagc agcaggcccg
      601 caacaagggt cagctgaatc ggcgcgaaac gcttgccgat ctcgcccgca gcctgccctg
      661 gcggacatcg acgacagatg cgagcactgg tgctggtggt gctggggctg ggactggttc
      721 cagtaccagt gggggcaata tcacgtacat tgccccacgc aagcgtcgcg agtcgagcgc
      781 cgattccggc atacgcagca tcagatctcg ccgcgaatcg aacacggccg agttcgtgaa
      841 gcactggaac aggcgcgaga gcaccgccgt cgaggagcaa gcaccaagcc acatttccgt
      901 gaatgtggtg gtcgtcgaaa ctaccactaa gagcgcctcg cgccgcggat ccggggagag
      961 ctacctgtcg agcagccggc gggacagcaa tgtcgccggc cgcgtgacaa cgccgccacc
     1021 gccacccaag taccaggtga ccaagaagcg ggactcgctc gccgccccgg agttccccaa
     1081 cttccggcag gagcagcgcc cctccaccag ctccgccggc tcctgtcact ccgactccgt
     1141 ctccgtgcca ctaatccagt accatcagca ggtggactcc gcatgccagg ccctgccgcc
     1201 gcccaccatc atcaccagct cggtgacgcc gccggccacc agtccaacgg caccgaaggg
     1261 tcggcgcgac tccaccacac agtgcggccg cgtcaatcgg cgcgactcga aggcgggcca
     1321 cagtccggag cgcgcaccgc gcatgaaccg cctgcagcgg caggcgacgg ccttcgacga
     1381 gagcgttctg cctggcggca gtcgacgcgg ctcccagcca gccctcagcc cggatccgcc
     1441 cgaggattgt gagcgccgtg cctcgcgccg cgactccctt tcgccggaca gcgcctcgcg
     1501 cggcggacga cgcgactcgc gcacccatct ctcgcccgac cgcacacacg agcgcgacgg
     1561 cagtccacgg cgacacacgc tgcgccgcca gagcagctcg gcggcccgcc actcgcccga
     1621 atcgaacagc tgcggctcgt cgcgggatcc cagtccgtgc tcccggccac caccgttgcc
     1681 ggctgtggaa cagaaccaga gacccgccat caggcgccag tccaccaccg aggagatcct
     1741 cattgcgcgc ggctttcggc gccagtccac cacggaggag atgatacgct gccgcaactt
     1801 ccggcgccag agctcccaga gcgatgacgt ctgtcgctac cgcggacgtc gcgattcatc
     1861 ggctcagatc attgacggta ccatcggcac catgaccgtg gagaccacca gcactttctt
     1921 cgactccagc actcagacag aaccatcgcc gctgtacgac aacaaccact accatgagga
     1981 gtgtctgcgg tgcaactcgt gcggcttgaa tttgacagga cccaaccaga ggcgcgccag
     2041 gaggttcaag aaccagatcc tgtgcgacct gcatttcgca gacgtggccc taatggagtg
     2101 ctccgatttt atgcagcagc tgcggagctt caagccccaa tcgctgggct gtgcggtggc
     2161 gcgacgcaag agctccacga cgttaatatt tccattgccg ccgcaagcat gttcaggtat
     2221 gtag