PREDICTED: Drosophila obscura nuclear pore complex protein Nup153


LOCUS       XM_022364379            6776 bp    mRNA    linear   INV 14-MAY-2021
            (LOC111072471), mRNA.
ACCESSION   XM_022364379
VERSION     XM_022364379.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq; corrected model; includes ab initio.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022364379.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
            
            ##RefSeq-Attributes-START##
            ab initio   :: 1% of CDS bases
            frameshifts :: corrected 2 indels
            ##RefSeq-Attributes-END##
PRIMARY     REFSEQ_SPAN         PRIMARY_IDENTIFIER PRIMARY_SPAN        COMP
            1-1296              JAECWW010000165.1  1852381-1853676     c
            1297-1824           JAECWW010000165.1  1851762-1852289     c
            1825-2111           JAECWW010000165.1  1851380-1851666     c
            2112-5067           JAECWW010000165.1  1848312-1851267     c
            5068-5673           JAECWW010000165.1  1847705-1848310     c
            5674-6417           JAECWW010000165.1  1846960-1847703     c
            6418-6606           JAECWW010000165.1  1846688-1846876     c
            6607-6674           JAECWW010000165.1  1844844-1844911     c
            6675-6776           JAECWW010000165.1  1844007-1844108     c
FEATURES             Location/Qualifiers
     source          1..6776
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..6776
                     /gene="LOC111072471"
                     /note="The sequence of the model RefSeq transcript was
                     modified relative to its source genomic sequence to
                     represent the inferred CDS: deleted 2 bases in 2 codons;
                     Derived by automated computational analysis using gene
                     prediction method: Gnomon. Supporting evidence includes
                     similarity to: 2 Proteins, and 99% coverage of the
                     annotated genomic feature by RNAseq alignments, including
                     15 samples with support for all annotated introns"
                     /db_xref="GeneID:111072471"
     CDS             1099..6768
                     /gene="LOC111072471"
                     /note="The sequence of the model RefSeq protein was
                     modified relative to its source genomic sequence to
                     represent the inferred CDS: deleted 2 bases in 2 codons"
                     /codon_start=1
                     /product="LOW QUALITY PROTEIN: nuclear pore complex
                     protein Nup153"
                     /protein_id="XP_022220071.2"
                     /db_xref="GeneID:111072471"
                     /translation="MSDNEDSPHQNNQTKKQLQLQRNQATTFSTRSGGSTHPLTPLQE
                     ATEAEEGAEDDSAAGTPLVSRKSLMGRVKLRVSNILPSSWFSPTSKAALEAEQEQQEQ
                     QQQQQQQQQNGTGTTGTTSLTKRKRGRRRIELAEPDGEDSPAGGLLPDVDDGAAARGL
                     DYEEVALADNIAEHDLVAEDEQTRRSEYNVFLLRKRRAAIAADDDFDEDDDDVGDGDE
                     EEEEDDDGPAQASISAPTKRRRVELEISVNLPSMRRLPLPLVSSTPAAVASGGQLFTS
                     GNSQVVEGTRSHSRGSNPGGVAPHRRTHLNLYHQRQHRESGYNFFAGNETAAEATTGD
                     LPVSIRRSLNIPAIEHPRSRSFSFGQTQTSSNLSAMPLANHKRPPLLVGQTATARETC
                     RDVVQSENERIERLLNICKSNNNISSSNNNNIIKSKRGAATATGASGAADLESELNEY
                     PEGVEGGDSYPYHHNSNSNLSFYGNLQSAKSIFTRGSAQPPHHNSTCSLNSLNKRQRF
                     NASIYGSSSALSDSRLLTRSASASACGSGSTSSSPFYKGQTTFGGNSAHNRIFGQSAV
                     GGGSSSSLAMNSGGSSPAAHQVTSAVGSPANAGYGGMKPLAMQPSSNQPIIKQPEITN
                     ESVVDSMSLSSTTRRILSLLESYSTPLIDVKRLGNTLKEQQQLQRSTSNPYSRPNRSM
                     LHTDQQQQQQNQQQQQPQSLLAPTMQHILERRRLHRVSQCSKDLLLNYKPNASSAGGS
                     TSMALAALPARHTNNNNNNSHTNKMRSRLSHQSARKEPREDTELAPEPLDLPTINFPA
                     MANTPTFDLVIKPPPPTMPLVAANTTADLQMRPKPPQTAFPMPAVNFVCANVNSGAAA
                     PATAAAHAAFQPSSVSGRGFDFGEPIPILEESARIQGGTAHQTRITRDFSFTEPASLE
                     RQQQQQQQESLPFMNGPTTAAAAHNPSSSQQQVSSVFTLGVGVEGGFSQQFKKSATEW
                     ECDVCMIRNKSELVKCAACETPKPSKTTLPAAAPVPATVPFTGASGFGDRFKKSSSAW
                     ECDTCMVSNKNEANKCVACETPRPGAATAASKTTTTTDCFSITNSPGCGSGSGSGFGS
                     GFSTSSSSSGFGQAFRPKANTWECQTCLVMNQTTAVECVACQSRNPNASSESSSSSST
                     SNPPTNVSSSTSSSSNITSFKFGFPPEQQQQKQQQQQTGVKQDAGFQHLVAAQKAASW
                     ECETCMAMNDQSLSKCCCCEQLRPGADDCKSSSNATHPVPTFTFGFVPKAKEAAPVQP
                     VLSVQPAAVLSTSNIAAPQFSFGFGQSKDVADSKNASMGGFKFGAPATTTSSQEEAKS
                     IDLRAMPTATKATSTTGTETAAVVPAAAPPSQFSFRAPTTTTSTVLSSSSDASIAPAT
                     GTGTAAAAATVTSQVFSFGAPSSLPSSSSAVSSSTHTSGSNSSATSVISSNVKPMFSF
                     SAAVSASGSATPSGVSSSTSQQPTVTTASVGFFGAGTTTNPGGPATTTSTSFAATPAP
                     ALVPAAASAAAPTPAAGLFSFGSASSASSTTKLAPSSNSSTFFFGQTPTSTAAPSSNA
                     TTSIFGAAVTSVASGNNNSTSISFSSSTNAASTAAPAAAAAPTPVTFSFGEKRAASGA
                     PANSLTKPVSFGWPSPSASASPIPSNGSIAPATATATDSSSTTTNLPTVVSSNSVFGS
                     GFGSAFGSTSTASTPASTPAAATSAFGGNGAHPSTGFGFAGNSIASQSSPAPAPSSGP
                     APIFNNAIAPAFGGSNGGGGGGFGGGSNATAAKPAFNFGGSSALSQSAGTSGPFNFGG
                     GGGTGANATSTKPAFNFTGSATVSAAAATPQATTTFNFSASSAIANPLASGDSTPNAN
                     APFQFSAGAPAPANMFAFNPPPAGNAAQNSQMVRRKMRAPVRRLPPR"
     misc_feature    4009..4089
                     /gene="LOC111072471"
                     /note="Zn-finger in Ran binding protein and others;
                     Region: zf-RanBP; pfam00641"
                     /db_xref="CDD:395516"
     misc_feature    4012..4071
                     /gene="LOC111072471"
                     /note="RanBP2-type Zn finger [structural motif]; Region:
                     RanBP2-type Zn finger"
                     /db_xref="CDD:275376"
     misc_feature    4186..4263
                     /gene="LOC111072471"
                     /note="Zn-finger in Ran binding protein and others;
                     Region: zf-RanBP; pfam00641"
                     /db_xref="CDD:395516"
     misc_feature    4186..4245
                     /gene="LOC111072471"
                     /note="RanBP2-type Zn finger [structural motif]; Region:
                     RanBP2-type Zn finger"
                     /db_xref="CDD:275376"
     misc_feature    4300..4356
                     /gene="LOC111072471"
                     /note="RanBP2-type Zn finger [structural motif]; Region:
                     RanBP2-type Zn finger"
                     /db_xref="CDD:275375"
     misc_feature    4414..4503
                     /gene="LOC111072471"
                     /note="Zn-finger in Ran binding protein and others;
                     Region: zf-RanBP; pfam00641"
                     /db_xref="CDD:395516"
     misc_feature    4426..4485
                     /gene="LOC111072471"
                     /note="RanBP2-type Zn finger [structural motif]; Region:
                     RanBP2-type Zn finger"
                     /db_xref="CDD:275375"
     misc_feature    4555..4608
                     /gene="LOC111072471"
                     /note="RanBP2-type Zn finger [structural motif]; Region:
                     RanBP2-type Zn finger"
                     /db_xref="CDD:275375"
     misc_feature    4708..4767
                     /gene="LOC111072471"
                     /note="RanBP2-type Zn finger [structural motif]; Region:
                     RanBP2-type Zn finger"
                     /db_xref="CDD:275375"
ORIGIN      
        1 cgtcgcatta gctacacgcg tttttctcaa atcgtgcttt tttttgtgaa aaaattaaat
       61 taaatttaat ttaattaaag atgttttgcg acacaaatcc ggttggcagt gcgtgcagct
      121 aaaatgattt gagaatagca gggcatacgt tgcgtctctg gctgtacaac tcaagcattt
      181 tgaaaccaaa tgagtgcgtt tgcttgcagg cgaatgccat agctgggtat ctcgcgcgcg
      241 cgtgtgtgtg tgtggtgtat aaaagaattg caaaagaaaa aaacaagacg aaaaaaaaaa
      301 acgaagcgat tgtaggacga aatcaaacag gcaggcggta gggcaaagca aaaaggaaaa
      361 tagcaaaaac gctcttagcg cggcgtgcgg ttagtgtgtt atccggcgca gcgccaagcg
      421 tggatccaag cagaaaccca agcaacagca gtcggcaggc agcggcctcc gccaagctaa
      481 aaaaatatat atatatatgt aaaaaaaaga accccccgcc cgttttgcca tatttggttc
      541 actgacgaaa ttgagtccgc aataaacata atcctcattt gatcgagacg tgaaaaacga
      601 acaatttacc acatacatat gcacatacat catatatgta ccgaattttc tttacaattt
      661 ataatcccga tgtgaatctc atttaaccgc gtctcttgtg cttgcagagg aatatacata
      721 tatttgccgt gtgatggatg gataaataaa taaatacatt cagagctgct gcactttctg
      781 gcgccaaagt gcaaagacac acaaaaaaaa gatcgagaga aaaaaattta aaagaaaaaa
      841 aatcgccgcg tgtgtggaat ctcgtcgaca gaaaaccaat acagtgacac ggcgtgcgta
      901 acacacacac acattgaaca cactcaccca ggattgcaac agtgtgttcc gtttatattt
      961 ctttttttat tttttattgt tgttttgcgc gttagcgcgt gtgtgtggtg tgtgtgtgtg
     1021 ggcgtgtgtt agtttctttt tggttagttt tcattttgtg tgtcgtgccg tgtttcatcg
     1081 ccggcttaaa atccaataat gtcggataat gaggatagtc cacaccaaaa taaccaaaca
     1141 aaaaaacaac tgcagctgca acgaaaccaa gccacaacat tcagcacgag atcgggaggg
     1201 agcacacatc cgctcacgcc acttcaggaa gcgaccgagg ccgaggaggg ggccgaagat
     1261 gattctgctg ccggcacacc cctcgtctcc cgcaaatctc tcatgggaag ggtgaagctg
     1321 cgcgtttcaa atatcctgcc atcgtcatgg ttctcgccaa cctccaaggc ggccttggag
     1381 gccgaacagg agcaacagga gcagcaacaa caacaacaac aacaacaaca gaatggaaca
     1441 ggaacaacgg gaacaacgtc tctaacgaaa aggaaacgtg gacgccgtcg catagagctg
     1501 gccgaaccag atggcgagga ttcacccgct ggaggcctgc tacccgatgt ggatgatggt
     1561 gccgctgcac gaggtctgga ctacgaggag gtggccctgg ccgacaacat agccgagcat
     1621 gacttggttg ccgaggatga gcagacgcga cgcagcgaat acaatgtgtt cctcttgcgc
     1681 aaacggcgcg ctgcgattgc cgccgatgat gattttgatg aagatgacga cgatgtggga
     1741 gatggtgacg aagaggagga ggaggatgac gatggtccag cacaagcgtc catctctgcc
     1801 ccgactaagc gtcgacgtgt ggaactggag ataagcgtca atttgccaag catgcggcga
     1861 ctgccattgc cactggtttc ctctacgccc gccgctgtcg cttccggcgg ccaactattc
     1921 acctcaggca actctcaggt agtggaaggc acccgcagcc atagccgtgg ctccaatccg
     1981 ggtggcgttg ccccgcatcg tcgcacccac ttgaacctct atcaccagcg gcagcatcgt
     2041 gagtcgggct acaatttctt tgcgggcaac gagacggccg ccgaggccac cacaggagat
     2101 ctgccagtca gtatacgtcg atcgctgaac ataccagcca tagagcatcc acgcagtcgc
     2161 agcttcagct ttggacaaac gcaaactagc agcaatttgt ccgccatgcc attggctaac
     2221 cacaagagac cccctctgct ggtggggcag acggccacgg cccgtgagac atgtcgcgat
     2281 gtggtacagt cggagaatga gcggattgag cggctgctga atatctgcaa atccaataat
     2341 aatatcagca gcagcaacaa caacaacatt atcaaatcga agagaggcgc cgccacagcg
     2401 acaggcgcat caggagcagc agatttggag agcgaactga atgaatatcc ggagggagta
     2461 gagggtggcg actcctatcc ctatcatcac aacagcaaca gcaatctatc gttctatggg
     2521 aatttgcaga gcgcaaagtc aatatttaca cgcggctcgg cccagccgcc gcaccacaac
     2581 tcgacttgtt cgctaaactc gcttaacaag cggcagcgct tcaatgcctc catttatggc
     2641 agctcctcgg cattgagcga cagccggctg ttgacacgca gtgcttccgc ctcggcctgt
     2701 gggtccggtt caacatctag ctcgcccttc tacaagggcc agaccacatt cggcggcaat
     2761 tcggcacaca atcgcatctt tgggcagagt gctgttggtg gtggttcctc ctcctcgttg
     2821 gccatgaact ctggaggcag ttcgccggcc gcccatcagg tgacatcggc agttggcagt
     2881 cccgccaatg ccggttacgg cggcatgaag ccattggcca tgcaacccag cagcaatcaa
     2941 cccatcatca agcaaccaga gataacaaac gaatcggtcg tggacagcat gtccctctca
     3001 agcaccacac gtcgcatcct gagcctgctg gagagctact ccacgccact gattgatgtt
     3061 aagcggcttg gcaacaccct aaaggagcag cagcagctgc agcgtagcac cagcaatccc
     3121 tatagccggc ccaatcgttc tatgctgcac acagaccagc aacagcagca gcaaaatcag
     3181 cagcaacagc agccacaaag tctgctggca cccaccatgc agcacatact cgaacgacgt
     3241 cgcctgcatc gtgtcagcca gtgttcgaag gatttgctct tgaattacaa gccaaatgca
     3301 tcatcggccg gtgggtccac ctcaatggcc ctggcggctc tgccagcccg tcacaccaat
     3361 aataataaca ataatagtca cacgaacaag atgcgttccc gactgagtca tcagtcggcg
     3421 cgcaaggagc cgcgcgaaga taccgaactg gcacccgaac cactcgactt gccgacgatc
     3481 aacttcccgg ccatggcaaa tacaccgaca tttgatttgg tcatcaagcc gccgccgcca
     3541 acgatgccat tggtggcagc gaacacaacg gcggatcttc agatgcgtcc caagccgccc
     3601 caaacagcat tccctatgcc tgcggttaat tttgtgtgtg ccaatgtgaa ttctggagca
     3661 gcagcaccag ctacagctgc agctcatgct gcgtttcagc ctagcagcgt atcaggacgt
     3721 ggcttcgatt ttggagaacc catacccata ctggaggaaa gtgcaaggat tcaaggtgga
     3781 actgcacatc aaacgaggat cacgcgcgat ttctccttta cagagccagc ttcattggag
     3841 aggcagcagc agcaacagca gcaagagtct ctgccattta tgaacggccc caccaccgca
     3901 gcagctgcac ataatccaag cagcagccag cagcaagtat catccgtatt cacactggga
     3961 gtgggagtgg aaggaggctt tagccagcag tttaaaaaat cagccactga atgggagtgc
     4021 gatgtgtgca tgatcagaaa taagtcggag ctggttaagt gtgcagcatg cgagacgcca
     4081 aagccttcca agactactct accagctgca gctccagttc cagctacagt cccattcacg
     4141 ggtgccagcg ggttcggaga tcgtttcaag aagtcttcga gtgcctggga atgcgacacg
     4201 tgcatggtat ccaacaagaa tgaggccaac aagtgcgtgg cctgtgagac gccacgcccg
     4261 ggagctgcta cagcggccag caagaccacc accaccaccg actgtttctc aattacaaac
     4321 agcccgggat gcggctccgg ctctggctct ggcttcggat cgggtttctc tacatccagt
     4381 tcgagttccg gatttgggca ggccttcagg cccaaggcca acacatggga gtgccagaca
     4441 tgcctggtga tgaatcagac gacagccgtc gagtgcgtcg cctgccagtc gcgcaatccc
     4501 aatgccagca gcgagtccag ctcgagctcc tccacaagta atcctccaac caatgtctct
     4561 tcaagcacca gcagcagcag taacatcacc agcttcaagt ttggcttccc cccagagcag
     4621 cagcaacaga aacagcagca gcagcagacg ggagttaaac aggatgccgg tttccagcac
     4681 ctggtggctg cccagaaggc agccagctgg gagtgcgaga cgtgcatggc tatgaacgac
     4741 cagtcactct ccaagtgctg ctgctgcgag caactgaggc cgggagccga cgactgcaaa
     4801 tcctcatcca acgccactca ccctgtgccc acgtttacgt tcggttttgt gccaaaagca
     4861 aaggaagcag caccagtcca gccagtactg tcagtccaac cggctgccgt cctgtccaca
     4921 tcgaacatcg ctgctcctca gttctcgttt ggctttggcc agagcaagga tgtggcagac
     4981 agcaagaacg cttcaatggg aggattcaag ttcggagccc cagccaccac caccagcagt
     5041 caggaggagg caaagtcgat cgatctaagg gctatgccga cggccacaaa ggccacatcc
     5101 accacgggaa ccgagacggc agcagttgtt ccagcagcgg ctccccctag ccaattttca
     5161 ttcagagccc ccaccaccac cacatcgaca gtgctgtcat ccagcagcga cgcttccatc
     5221 gctcccgcta ccggtaccgg taccgccgct gccgctgcca ctgtcacgag tcaagtgttc
     5281 agctttggtg ccccgtcatc attaccttca tcatcatcgg ccgtgtccag ttcgacgcat
     5341 acttcgggca gcaactccag cgccaccagc gtgatcagct ccaatgtgaa gccaatgttt
     5401 agcttcagcg ctgccgtctc tgcctctggc tccgccacgc ccagcggcgt tagcagcagc
     5461 acaagccaac agccgacggt gacgacggca tccgtgggct tctttggggc tgggaccacc
     5521 accaatccag gaggaccagc cacaacaact agcacatcgt ttgcagcaac accggctcca
     5581 gcattggttc ctgctgctgc ttctgctgca gcgccaacgc cagcggcagg cttgttcagc
     5641 tttggcagtg catcttcagc tagctccacg acaaagctgg cccccagcag caacagcagc
     5701 accttcttct ttggccagac tccgacatcg acggcagcgc cgagttcaaa tgcgacgacc
     5761 tccatctttg gcgcagcagt aacatcagta gcctcgggta ataataacag cacgtccatt
     5821 agcttcagca gcagcaccaa cgcagcctca actgctgcgc cagccgcagc tgcagctcca
     5881 actccggtga cgtttagctt tggggagaag agagcggcat cgggtgctcc cgcaaacagc
     5941 ctgacaaagc ccgtaagctt tggctggccc agtcccagtg ccagcgctag ccccataccc
     6001 agtaatggca gcatagctcc ggccaccgcc acagccactg acagcagcag caccaccacc
     6061 aacctcccga cggtggtgtc cagcaactct gttttcggca gtggatttgg gtcagctttc
     6121 ggcagtacat cgaccgccag cacaccagca tcaacgccgg cagctgcgac ttcagctttt
     6181 ggcggtaatg gagcacaccc cagcacgggt ttcggctttg cgggtaactc gatagcatcc
     6241 caatcttcgc ctgcgccagc gccctcatca ggcccggctc ctatattcaa caatgccatc
     6301 gcgcctgcct ttggtggcag caatgggggt ggaggtggag gattcggcgg cggaagcaat
     6361 gcaacagctg caaagccagc atttaacttt ggaggctcct cggctctttc ccagtcggcg
     6421 ggcacatctg gacccttcaa ctttggtggt ggcggcggca ccggggccaa tgcgacgtcc
     6481 acaaagccgg cctttaattt tacgggctcg gctactgtgt ccgccgcagc agcaacacca
     6541 caggcgacga ctacctttaa cttttccgcc agttcggcga ttgccaatcc cctagcatcg
     6601 ggcgattcaa cgccaaatgc caacgcaccg ttccaattta gtgccggtgc tccggcgcca
     6661 gccaatatgt tcgccttcaa tccaccgcca gctggaaacg ccgcccagaa ttcacagatg
     6721 gtgcgccgca agatgcgcgc ccccgtgcgc cgtttgccgc cacggtagaa gtggca