PREDICTED: Drosophila obscura Alstrom syndrome protein 1 homolog a


LOCUS       XM_022364326            3731 bp    mRNA    linear   INV 14-MAY-2021
            (LOC111072447), mRNA.
ACCESSION   XM_022364326
VERSION     XM_022364326.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq; corrected model; includes ab initio.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022364326.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
            
            ##RefSeq-Attributes-START##
            ab initio   :: 1% of CDS bases
            frameshifts :: corrected 1 indel
            ##RefSeq-Attributes-END##
PRIMARY     REFSEQ_SPAN         PRIMARY_IDENTIFIER PRIMARY_SPAN        COMP
            1-1499              JAECWW010000165.1  2003343-2004841
            1500-1741           JAECWW010000165.1  2004909-2005150
            1742-2740           JAECWW010000165.1  2005152-2006150
            2741-3398           JAECWW010000165.1  2006226-2006883
            3399-3547           JAECWW010000165.1  2006954-2007102
            3548-3731           JAECWW010000165.1  2007170-2007353
FEATURES             Location/Qualifiers
     source          1..3731
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..3731
                     /gene="LOC111072447"
                     /note="The sequence of the model RefSeq transcript was
                     modified relative to its source genomic sequence to
                     represent the inferred CDS: deleted 1 base in 1 codon;
                     Derived by automated computational analysis using gene
                     prediction method: Gnomon. Supporting evidence includes
                     similarity to: 5 Proteins, and 99% coverage of the
                     annotated genomic feature by RNAseq alignments, including
                     15 samples with support for all annotated introns"
                     /db_xref="GeneID:111072447"
     CDS             164..3610
                     /gene="LOC111072447"
                     /note="The sequence of the model RefSeq protein was
                     modified relative to its source genomic sequence to
                     represent the inferred CDS: deleted 1 base in 1 codon"
                     /codon_start=1
                     /product="LOW QUALITY PROTEIN: Alstrom syndrome protein 1
                     homolog a"
                     /protein_id="XP_022220018.2"
                     /db_xref="GeneID:111072447"
                     /translation="MPGHQRIGTHLRKHTDEKRLLASRVPPKAREYLSELAVDRELER
                     FMALSSTNSSGTSRSNVSMYTAPLHCTPRSVSVAPSKPARCSGGSGGKTTSAAAGQPH
                     QHQETAAAAADATVASVPKETQSDKEIIRIIPIVATDCVVGCEGMRTSQAVSAEDLRT
                     PTKPAGSQAPDRTPEKKSKNTQTPESAVKSHKRLEWDPAADVGYYKRAVSTSNISTLE
                     RSILEECWRQPQQRSETDLDRLQLEQGTTLAQRPPLASSTFVNRSERRTTPSLGSIRS
                     SSNQSNRSSSRRESKSQSRCTSPNGGSSVASSFDYHSSLPSAQSSSQKQLAKEEERQY
                     TAAQLEKVLAGAASRRQAKEDKENCQPAAQRGSSSSSSSTAAGTEAETGPGPAGGPKG
                     ELDLGVDLLCSLVQARSLSHKQKKHLIRDIAKRISCIELGESLRSRQSPTKAKAAAQL
                     QDMATNTTASVARPVPAPRTRILIANSSGTSTASSSKEMVTARTNPRACKAAKEPTTE
                     PQQLQLPSSEASSISHEGEATSSHSNEAVPAPLPATTTAPAETELVSQEWLNPMTQSE
                     IEYEERSRSSSNDSERRLTLSWIELEIKRLQTVYKIVNSKSFLQIVPVDDKSPTAAIE
                     YDPLISAEPLIELLPDGEGPQRRATVRARMIGAGQEQEPLLLGVQVKHVHPRGLQEKP
                     VHLQGEQEEPLRSVEQPPDEVRCITKPHADVESPAAAPELQAIPTPPPPPPPPPPRGI
                     PQRGKMATPNSSSDGGRSESVCSFVQQRQRQFMEHYQNQQQQQLQQLQQHQQLQQLQQ
                     QQQKQQKQRKQQRILPRMPHLLHHPQHQEHQHYHPLVHGHGQGHGLCVHQQEQQQQQL
                     QHMAPQHYIQMQYTQAAGSGSGMDAGGVYYTAVPHGYSLLSSDAMAEYVQVASEAAEG
                     AEERCAATTRTTTTSSSSISSMLCLSSEMSIPMGGGGVVNTSKTTTTTTTHQYDEATS
                     GSRCQRKRRDQTQKQTQTQTQRRGAHGIAYMIQFGESEMQHTMSLQDHLQLARPKFCA
                     KSKQRKAILNQMQMLRSERRRELEELLGEDCTLETLDRRLQQLPPPVTSCVRVFSTKE
                     MKAMTSKRCQRLPEVVAAQNREREERRRRSNRLMRDVFNRRMQNRVSKGKISLNHSLT
                     II"
     misc_feature    <1673..>2056
                     /gene="LOC111072447"
                     /note="Sperm equatorial segment protein 1; Region: SPESP1;
                     pfam15754"
                     /db_xref="CDD:464848"
     misc_feature    3200..3577
                     /gene="LOC111072447"
                     /note="ALMS motif; Region: ALMS_motif; pfam15309"
                     /db_xref="CDD:464634"
ORIGIN      
        1 tagccaacac tgaacggata tcagcacttt gaaacactgc ctaacaatgc acgaaaattc
       61 cgtcgcattt aaaaaaatgc aatttacatt ttaaaacaaa acaccaactg caattttgac
      121 atattagttt atattgctgc caacacacgt gagacggtgc aaaatgcctg gccaccagcg
      181 aattggcaca cacctccgca agcacacgga cgagaagcgt ctgctggcgt cgcgcgtccc
      241 tcccaaagcc agggaatacc tatccgaact ggccgtcgat cgggagctgg agcgcttcat
      301 ggccctgtcc tcgaccaata gcagtggcac cagtcgcagc aatgtgagca tgtacacggc
      361 tcccctacac tgcactcccc gttcagtgtc agtggcgcca tcaaagccag cccgctgcag
      421 tggcgggagc gggggaaaaa cgacatctgc agcagctgga caaccgcatc agcatcagga
      481 aacagctgcc gctgccgctg acgctacagt tgcgtctgtg ccaaaggaaa cacaaagcga
      541 taaggagatc atcaggatta tacccattgt agccaccgac tgcgttgtgg gctgcgaagg
      601 gatgcgcacc agtcaagccg tgtccgcgga ggatctacgc acacccacca agccagcggg
      661 cagtcaggcg ccagacagga cgcccgagaa aaagtcaaaa aatacccaaa cgcccgaatc
      721 ggccgtgaaa tcgcacaagc gccttgaatg ggacccagcc gcggatgtgg gctactacaa
      781 gcgggcggtg tccaccagca acataagcac cctggagcgt tccattctgg aggagtgctg
      841 gcggcagcca cagcagcgtt cggagaccga tttggatagg ctgcagctgg agcagggaac
      901 aacgctggca cagcggccac cgctcgcctc cagtacgttt gtgaaccgca gcgaacgcag
      961 gaccacgccc agtctgggga gcattcgcag cagcagcaat caaagcaatc gcagcagctc
     1021 caggcgagag tccaagtcgc agtcacgctg cacatcccca aatggcggca gctcggtggc
     1081 cagtagcttt gattatcact cgtcgttgcc ctctgctcag agtagctccc aaaagcagct
     1141 ggcaaaggag gaggagcgtc agtatacggc cgcgcagctg gagaaggttc tggccggggc
     1201 tgccagtcga aggcaggcga aggaggacaa agaaaactgt cagccggctg cccagagagg
     1261 tagctcctct tcttcgtcct ctactgctgc aggaactgaa gctgaaacag gaccgggccc
     1321 tgctggtggt cccaagggag agcttgactt gggcgtggat ctgctctgtt cgctggtgca
     1381 ggcccgcagt ctcagccaca agcagaagaa gcatttgata cgggacatag cgaagcgcat
     1441 ctcctgcata gaactggggg agagcctgcg ctcccgccaa agcccaacaa aggcaaaagc
     1501 tgctgcccag ctgcaggaca tggccaccaa cactactgcc agtgtggcac gtcctgtgcc
     1561 cgctccgagg acacgcattt tgatagccaa ctcctcgggc acctccacag cgagcagctc
     1621 caaggagatg gtcaccgcac ggaccaatcc acgggcctgc aaagcagcca aagaacccac
     1681 gacggaacca cagcagctgc agcttccctc ttcggaggcc agcagcatct cccatgaggg
     1741 tgaagccaca tcttcgcaca gcaatgaggc tgttcccgca ccgctacctg ctaccactac
     1801 cgctcccgcg gaaacggagc tagtgagcca ggagtggctc aatcccatga cccagagcga
     1861 gatcgagtac gaggagcgtt cgcgttcgtc cagcaacgat tcggagcgtc gcctaacgct
     1921 cagttggatc gagttggaga tcaagcggct gcagacggtg tacaagatcg tgaatagcaa
     1981 atcgttcctc cagattgttc cagttgatga caagagtccc acggctgcca tcgagtacga
     2041 tcccctgatc agtgcagagc cgttgattga gctgctgccg gatggggagg ggccacagcg
     2101 tcgagccact gttcgggcac gcatgattgg tgctggtcaa gagcaggaac cacttctgtt
     2161 gggtgtgcaa gtgaagcatg tacaccctcg gggattgcaa gagaagcctg tgcatcttca
     2221 gggagaacaa gaggagcctc taagatccgt agagcagccc ccagacgagg ttagatgcat
     2281 aacaaagcca cacgctgatg tggagtcgcc agcagcagca ccggaattac aggcgatacc
     2341 aaccccacca ccaccgccac ctccaccacc accgaggggc attccacagc gaggaaaaat
     2401 ggccacaccc aacagctcca gtgatggcgg acgcagcgaa agtgtgtgct cttttgtgca
     2461 gcagcgacag cggcagttta tggagcacta tcagaaccaa cagcagcagc agctgcaaca
     2521 gctgcaacag caccagcagc tgcagcagct gcagcagcag cagcagaaac aacagaagca
     2581 aaggaagcag cagcgtatac tgccacggat gccacatctt ctacaccatc cacagcatca
     2641 ggagcatcaa cattaccatc cactggttca tgggcatggg caggggcacg ggctgtgtgt
     2701 gcaccagcaa gagcagcagc agcagcagct gcagcatatg gcaccacagc attacattca
     2761 aatgcaatat acgcaggcag caggatcagg ctcaggaatg gacgctggtg gtgtctacta
     2821 cacagcagtg ccccacgggt acagcctttt gagcagcgat gccatggccg aatatgtgca
     2881 ggtggcatca gaagcagcag aaggcgccga agaacgctgc gccgccacca cgaggacaac
     2941 gaccaccagc agcagttcga tctcttccat gttgtgcctc agctcggaga tgtccatacc
     3001 aatggggggc ggtggagtgg taaacacctc caagacgacc accacaacca ccacgcatca
     3061 gtacgacgag gctacatcgg gcagtaggtg tcagcggaag cgcagggacc agacacagaa
     3121 gcaaacgcag acacagacac agcgcagggg agcgcatggc attgcgtata tgattcagtt
     3181 tggggagagc gaaatgcagc acacaatgtc gctgcaggat cacctgcagc tcgctcgtcc
     3241 caagttctgt gccaagtcca agcagcgcaa ggccatactc aatcaaatgc agatgctgcg
     3301 cagcgagcga cggcgcgaac tggaggagct gctcggtgag gattgcaccc tggagacact
     3361 ggacaggcgg ctgcaacagc tgccaccgcc agtcacatct tgcgttcgag ttttctccac
     3421 gaaggagatg aaggccatga ccagcaaacg atgccagcga ctgcccgagg tggtggccgc
     3481 tcagaatcgt gagcgcgagg agcgacggcg tcgcagcaat cgcctcatgc gggatgtctt
     3541 caatcggcgc atgcaaaacc gcgtgtccaa gggcaagata tccctgaacc acagcctgac
     3601 aatcatttag gaataccacc ccctcccacc cctacaagat ggagacaaca ctttgccagt
     3661 tgaaggcttg atttatgttt ttatattatc acttttaatt tttgttttcg aataaaaaac
     3721 tgttcaaatg a