PREDICTED: Drosophila obscura regulator of nonsense transcripts 2


LOCUS       XM_022364230            5232 bp    mRNA    linear   INV 14-MAY-2021
            (LOC111072391), mRNA.
ACCESSION   XM_022364230
VERSION     XM_022364230.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq; corrected model.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022364230.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
            
            ##RefSeq-Attributes-START##
            frameshifts :: corrected 1 indel
            ##RefSeq-Attributes-END##
PRIMARY     REFSEQ_SPAN         PRIMARY_IDENTIFIER PRIMARY_SPAN        COMP
            1-2833              JAECWW010000165.1  1787540-1790372
            2834-3122           JAECWW010000165.1  1790453-1790741
            3123-3854           JAECWW010000165.1  1790803-1791534
            3855-5232           JAECWW010000165.1  1791536-1792913
FEATURES             Location/Qualifiers
     source          1..5232
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..5232
                     /gene="LOC111072391"
                     /note="The sequence of the model RefSeq transcript was
                     modified relative to its source genomic sequence to
                     represent the inferred CDS: deleted 1 base in 1 codon;
                     Derived by automated computational analysis using gene
                     prediction method: Gnomon. Supporting evidence includes
                     similarity to: 2 Proteins, and 99% coverage of the
                     annotated genomic feature by RNAseq alignments, including
                     17 samples with support for all annotated introns"
                     /db_xref="GeneID:111072391"
     CDS             138..3881
                     /gene="LOC111072391"
                     /note="The sequence of the model RefSeq protein was
                     modified relative to its source genomic sequence to
                     represent the inferred CDS: deleted 1 base in 1 codon"
                     /codon_start=1
                     /product="LOW QUALITY PROTEIN: regulator of nonsense
                     transcripts 2"
                     /protein_id="XP_022219922.2"
                     /db_xref="GeneID:111072391"
                     /translation="MPTNKSGPTVAERPAEIPETATTNSSHAAAAASATATTTSEVEA
                     EAVPEASPNDDGDGDGDDAAKEAEEREELRLFIQELGEKIESKRLMRQQNANIELPGE
                     EFFARLDSSLKKNTAFVKKLKMFTTTQLEPLLRELSALNLSKYISEICAALAEAKLKM
                     NDVPSVVMLSSRLHATYVDFDTHFLEAWQKVLNMKGEKIGNPSKLRVDLRLFAELISS
                     GVIQMKPGLALLGMVLVQLIGQDKDGHNNFSIILSFCRHCGEEYAGLVPQKMQQLALK
                     YDVEVPKSDFLAADKQANLRTMLKGYFKALCKHVLAEQTELMNMTKNIRRTMECKGEI
                     SSEKREKCEMMQASFDKLLASAQTLSELLAEPLPELAKESECCSPGTVIDNMLDSAAL
                     GVLDPWGDEETRAFYTDLPDLRQFLPDFSAPKVDLETMEEPSELTEEAIDANLDAEMD
                     IDDPPSTNSDPPSENTADDQPPPSSTPPLLLAPTGTSPNDLKPQKMCSALMELGRQQL
                     QSQPPTAQTQQQIRQQFDTFLVNLFNCVNKELIDSAAIEFLLNFNTKHQRKKLTRTIF
                     SVQRTRLDILPYLSRFMAVVHMCNTDVAADLSELLRKEFKWHIRKKNQLNIESKLKIV
                     RFIGEQVKFGLFKKFDALGCLKMLLRDFQHHQIEMACAFVEVTGVYLYNCRDSRLLMN
                     VFLDQMLRLKLATAMDSRHAAQIESVYYLVKPPESSKRESAPRPVIHEYIRHLIFEEL
                     CKQNVERCIKMLRRIDWLDPDTSGYAIKCLSKAFLLRFPLIRCLADLVSGLSSYQPRA
                     VTIVIDNVFEDIRAGLEIHSPRMAQRRIAMAKYLGEMYNYKLVESTHILNTLYSIISL
                     GVSTDQSVVSPLDPPESLFRLKLACMLLDTCGPYFTSQATRKKLDYFLMFFQHYYWFK
                     KSHPVFCRDNESSADLFPILVDHTYRDCLGAVRPKLKLYTSLEQAKESIDQLQERLFP
                     HLKSHASNPNLASLNEISELDEGPTDEDSGSSNDQRERQVAGLEPEQSNECTENETDV
                     PMGPPPPPEWSKEDLDFEQQYERMTTDSYQERLKEPVKATAKDIPVPMMARLQKKSYE
                     QITAGSQISKVSSCPDLPPRSPAPDLPESSSGKTAASNAGGTGGGGGGGGATPAAAAA
                     VPFVLMVRGNRGGKQQFKSFVCASDSHLAINLKVQEQKIREEKEKVKRLTLNITERIE
                     EEDYQESLLPPQHRNFTQSYYQKPNRQKFKHQKGAPDADLIFH"
     misc_feature    471..1058
                     /gene="LOC111072391"
                     /note="Middle domain of eukaryotic initiation factor 4G
                     (eIF4G); Region: MIF4G; smart00543"
                     /db_xref="CDD:214713"
     misc_feature    1731..2282
                     /gene="LOC111072391"
                     /note="Middle domain of eukaryotic initiation factor 4G
                     (eIF4G); Region: MIF4G; smart00543"
                     /db_xref="CDD:214713"
     misc_feature    2325..2903
                     /gene="LOC111072391"
                     /note="Middle domain of eukaryotic initiation factor 4G
                     (eIF4G); Region: MIF4G; smart00543"
                     /db_xref="CDD:214713"
     misc_feature    3261..3731
                     /gene="LOC111072391"
                     /note="Up-frameshift suppressor 2; Region: Upf2;
                     pfam04050"
                     /db_xref="CDD:461146"
ORIGIN      
        1 tccgcggtca cactacatcc aacaaatgaa acaaatttgc ctgaaacttc ccagatattt
       61 ctgatatttc tgttttgtaa ttacaaaaca acatcgaggc tagcgtgaga caaatcatat
      121 tacttacatt tgccgccatg cccactaaca agtcgggccc aactgtggca gagagaccgg
      181 ccgagatacc ggaaaccgcg acaacaaact catcccatgc tgccgcagcc gccagcgcca
      241 ccgccacaac aacatccgag gtagaagcag aagcagtccc agaggcgtcg ccgaacgatg
      301 acggtgatgg cgatggcgat gatgctgcca aagaggcaga ggagcgcgaa gaattgcggc
      361 tgttcatcca agagctgggt gagaaaatcg agagcaagcg gctgatgcgt cagcaaaatg
      421 ccaacatcga gcttcccggc gaggagttct ttgcccgcct cgactccagt ctcaagaaga
      481 acacggcgtt tgtgaagaag ctgaaaatgt tcaccaccac gcagctggag ccgctgctcc
      541 gcgagctgtc cgccttgaat ctaagcaagt atatttcgga gatatgtgcc gccctggcgg
      601 aagccaagct caagatgaac gatgtgcctt cggtggtgat gctatcctcg cgcctgcacg
      661 ccacctatgt ggacttcgac acgcacttcc tggaagcctg gcagaaggtg ctgaacatga
      721 agggcgagaa gatcggcaac ccgagcaagc tgcgcgtcga tctgcgtctc ttcgccgagc
      781 ttatcagctc gggtgttatc cagatgaagc ccggcctggc cctgctgggc atggtgctgg
      841 tgcagctaat cggccaggac aaggacgggc ataacaactt ctcgattata ctctcgtttt
      901 gccgccactg cggcgaggag tacgctggcc tggtaccgca gaaaatgcaa caactggctc
      961 tcaagtacga cgtggaggtg cccaaatccg atttcctggc agcggacaag caggcaaact
     1021 tgcgcaccat gctcaagggc tacttcaagg ccctgtgcaa gcatgtcctg gccgagcaga
     1081 ccgaactgat gaacatgacg aagaacatac gtcgcacgat ggagtgcaag ggcgagatct
     1141 catcggagaa gcgtgaaaag tgcgaaatga tgcaggcgag cttcgacaag ctgctggcct
     1201 ctgcccagac gctgtcggaa ctgttggccg aaccgctgcc agagctggcc aaggagtcgg
     1261 agtgctgcag tccgggcaca gtgattgaca atatgctgga cagtgccgcc ttgggggtgc
     1321 tcgatccttg gggcgatgag gagacacgtg ccttttacac agatctgccc gatctgcgcc
     1381 agttcctacc cgacttctcc gcccccaagg tggacctaga gacgatggag gagcccagcg
     1441 aactgaccga agaggccatc gatgccaatc tagatgccga aatggatatc gatgatccac
     1501 cctccaccaa ttcggatccg ccgtctgaga acactgccga cgaccagccg ccaccaagca
     1561 gcactccacc gctgctgctg gcccccacgg gcacctcgcc gaacgacttg aagccgcaga
     1621 agatgtgcag cgctctgatg gaactgggac gccagcagct gcaaagccag ccgccgacgg
     1681 cccagacaca gcaacagata cgccagcaat tcgatacatt tctcgtgaat ctcttcaatt
     1741 gcgtcaacaa ggagcttatc gactcggccg ccatcgaatt tctgctcaac ttcaacacaa
     1801 aacaccagcg caagaagctg acccgaacga ttttctcggt gcagcgcacc cgcctggata
     1861 ttctgcccta tctgtcgcgc ttcatggccg tcgttcacat gtgcaacacg gacgtggccg
     1921 ccgatctgtc cgagctgctg cgcaaggagt tcaagtggca tatacgcaaa aagaatcaac
     1981 tgaatatcga gtccaagctg aagatagtgc gtttcattgg cgagcaggtg aaattcggcc
     2041 tgttcaagaa attcgacgcc ctcggatgcc tcaagatgct gctgcgcgac tttcagcatc
     2101 atcagatcga gatggcatgc gcatttgtgg aggtgactgg tgtatatctg tacaattgtc
     2161 gcgactcccg tctgctcatg aacgtcttcc tcgaccaaat gctgcgcctg aagctggcca
     2221 ccgccatgga ctcgcgtcat gcggcccaaa ttgaaagtgt ctactatctg gtgaagccgc
     2281 cagagtcatc caagcgcgag tcagccccac gtcccgtcat tcacgagtac atacgccacc
     2341 tgatcttcga ggagctgtgc aagcagaacg ttgagcgttg catcaaaatg ctgcgtcgca
     2401 tcgactggct ggatccggat accagcggct atgccatcaa gtgcctgagc aaagcatttc
     2461 tattgcgctt cccactcatc cgctgcctgg ccgatctggt gtccgggctc agttcgtacc
     2521 agccgcgggc cgtcaccatt gtcattgata atgtgttcga ggatatacgc gccgggctcg
     2581 agatacattc gccgcgcatg gcacagcgtc gcattgccat ggccaagtat ttgggcgaaa
     2641 tgtacaacta caagctggtg gagtccacac acatactgaa taccctgtac tccattatct
     2701 cgctgggtgt gtccacggat cagagtgtgg tgtcgccgtt ggatccgccg gagagcctgt
     2761 ttcgcctgaa gctggcctgc atgctactcg acacctgcgg cccctacttc accagccagg
     2821 ccacgcgcaa gaagctggac tatttcctga tgtttttcca gcactattac tggttcaaga
     2881 agtcccatcc cgtcttctgt agggataatg agagctcggc ggatctcttt cccatactgg
     2941 tcgatcacac atatcgcgac tgtctgggcg ctgtccggcc caagctgaag ctttatacta
     3001 gcctggagca ggccaaggag tccattgatc agttgcagga gcgactcttt ccccatctga
     3061 aatcgcatgc cagcaatccc aatctggcta gcctcaatga gatcagtgag ctggacgaag
     3121 ggcccactga cgaggattct ggcagctcga acgatcagcg agagcgtcag gttgccggcc
     3181 tggagccgga gcagagcaac gaatgtactg aaaatgagac agatgttcca atgggaccac
     3241 cgccaccgcc ggaatggtcc aaggaggact tggacttcga gcagcaatat gaaagaatga
     3301 cgacagattc gtatcaggaa cggctgaagg agcccgttaa ggctaccgcc aaggacatac
     3361 ccgtacccat gatggcgcgt ctgcagaaga agtcatacga acagatcaca gccggatcac
     3421 agatctcaaa ggtatccagc tgtccagatc tgcctccccg ctcgccagca cccgatctgc
     3481 ccgagagctc ctcaggcaag acagcggcca gcaatgctgg tggaactggt ggaggaggag
     3541 gagggggagg ggcaacgcca gctgcagcgg ctgctgttcc atttgtgctg atggtgcgcg
     3601 gcaacagggg cggaaagcag caatttaaat cgtttgtctg tgcctcggac tcgcacttgg
     3661 ccatcaatct gaaggtgcag gagcagaaaa tacgcgagga gaaggagaag gtgaagcgcc
     3721 tcacactgaa catcaccgag cgcattgagg aggaggacta tcaggagtca ctactgccgc
     3781 cgcagcatcg aaatttcact cagagctact accagaaacc caacagacaa aagttcaaac
     3841 accagaaggg cgccccagat gcggatctca tatttcactg agacgcccag cagccacagc
     3901 cctcaggccg acgacaacag accaatccaa gtcaagttaa caatcaggga atgcgctcac
     3961 ggactcacac tggcatcgca gcaaccatgg ttaaagcggg aagatggatg gtgcctccaa
     4021 caacagcaac aacaacattc aagtttacaa atagttgtcg aaatattgta acaggcaaca
     4081 ggaatacgaa cgggagagag agagaaggtg ctccaagaga ccttgattct ccgatacaca
     4141 ccgatccaca ccgtgttcca tgtgcaatcc tctggtacag ggacacacac acacggatat
     4201 acagacgttt ttataccgta cttaagttga gctctcacca cacagcgctc gtccgcttta
     4261 taccaacgcc agcgcgttag catgcccacg agattctaca ctcattgcca atgccatgcc
     4321 acagatcgtg cggcatggca gctcaagata ttgtaaggct ctccacaacg ccccccgcca
     4381 accccaaaca atatccttcg ctatggtgca catagagagc acagccgatc ccttaaaatt
     4441 aaccatatac acatacatac atatagtacg tacaattgca tcgacttgtt ttgaaaacaa
     4501 acctaccccc tactgatcga ttgatatata aaaagtgcat atataccata tacatatgtt
     4561 ttttgtaaat atatacatac atacatacat atgtatccgt acacatacac gcccgtaact
     4621 gaaaccgaaa ccacccaact gatggctgtt tcccctccgc ccacagagag caggaatata
     4681 ctataccact tacttacatt agatcagggg aatatatcta atctatacag atttgatata
     4741 tattcatatt tatacacgcg catgtatagt taatgggttt ccactccacc tccacctccc
     4801 ctcccctcca ctcccttgct gtcttgactg gacatcgaca cactaaaata gtgcatacct
     4861 tcccaagact cgtttgactt ttgaattttt atttgttttt cgttttattt tatttgctct
     4921 aaaattagcg tcaaacaatt tgattttgat ttatttttaa atttcctctt catcttatcc
     4981 cattgtatat tgccagtgtg ttggtgtatt cgttaaataa caatattcca aaatgtttta
     5041 cgcttttttt ttatgcttct ttttttgttg cttgcttata caaatgtttt cgttcgtttg
     5101 tttggtttta cttttaaaat gttaatcagt aatcagtaca aatggcaaaa gatataatat
     5161 ttatatagta gtattaattc actattaatg aacgaaaatc gattaaaaac aaaaacacac
     5221 acaaaagaga cg