PREDICTED: Drosophila obscura AP-1 complex subunit beta-1


LOCUS       XM_022364236            3347 bp    mRNA    linear   INV 14-MAY-2021
DEFINITION  PREDICTED: Drosophila obscura AP-1 complex subunit beta-1
            (LOC111072393), transcript variant X1, mRNA.
ACCESSION   XM_022364236
VERSION     XM_022364236.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022364236.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..3347
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..3347
                     /gene="LOC111072393"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 4 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 17 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111072393"
     CDS             114..2888
                     /gene="LOC111072393"
                     /codon_start=1
                     /product="AP-1 complex subunit beta-1"
                     /protein_id="XP_022219928.1"
                     /db_xref="GeneID:111072393"
                     /translation="MTDSKYFTTTKKGEIFELKSELNNDKKEKKKEAVKKVIASMTVG
                     KDVSALFPDVVNCMQTDNLELKKLVYLYLMNYAKSQPDMAIMAVNTFVKDCEDSNPLI
                     RALAVRTMGCIRVDKITEYLCEPLRKCLKDEDPYVRKTAAVCVAKLYDISATMVEDQG
                     FLDQLKDLLSDSNPMVVANAVAALSEINEASQSGQPLVEMNSVTINKLLTALNECTEW
                     GQVFILDSLANYSPKDEREAQSICERITPRLAHANAAVVLSAVKVLMKLLEMLSSDSD
                     FCATLTKKLAPPLVTLLSSEPEVQYVALRNINLIVQKRPDILKHEMKVFFVKYNDPIY
                     VKLEKLDIMIRLANQSNIAQVLSELKEYATEVDVDFVRKAVRAIGRCAIKVEPSAERC
                     VSTLLDLIQTKVNYVVQEAIVVIKDIFRKYPNKYESIISTLCENLDTLDEPEARASMV
                     WIIGEYAERIDNADELLDSFLEGFQDENAQVQLQLLTAVVKLFLKRPSDTQELVQHVL
                     SLATQDSDNPDLRDRGFIYWRLLSTDPAAAKEVVLADKPLISEETDLLEPTLLDELIC
                     HISSLASVYHKPPTAFVEGRGAGVRKSLPNRTAGTGVSSGAGDQQETGAGSEAMVIPN
                     QESLIGDLLSMDINAPSMPAAPTATSNVDLLGGGLDILLGGPPAEPAPGGASSLLGDI
                     FGLAGTSLSVGVQIPKVTWLPAEKGKGLEIQGTFSRRNGEVFMDMTLTNKAMQPMTNF
                     AIQLNKNSFGLSPASPLAAVPLPPNQTAEVSLALGTNGPIQRMEPLNNLQVAVKNNID
                     IFYFACLVHGNVLFAEDGQLDKRVFLNTWKEIPAANELQYSLSGVIGTTDGIASKMTT
                     NNIFTIAKRNVEGQDMLYQSLRLTNNIWVLLELKLQPGNPDATLSLKSRSVEVANIIF
                     AAYEAIIRSP"
     misc_feature    225..1718
                     /gene="LOC111072393"
                     /note="Adaptin N terminal region; Region: Adaptin_N;
                     pfam01602"
                     /db_xref="CDD:396262"
     misc_feature    264..338
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    order(312..317,324..326,333..338,423..428,435..437,
                     444..449,528..533,540..542,549..554,561..563,645..650,
                     657..659,666..671,774..779,786..788,795..800)
                     /gene="LOC111072393"
                     /note="putative peptide binding site [polypeptide
                     binding]; other site"
                     /db_xref="CDD:293787"
     misc_feature    372..455
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    474..566
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    591..671
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    702..800
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    1290..1364
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    1398..1487
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    1506..1598
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    1629..1739
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    2229..2519
                     /gene="LOC111072393"
                     /note="Adaptin C-terminal domain; Region: Alpha_adaptinC2;
                     smart00809"
                     /db_xref="CDD:197886"
     misc_feature    2547..2879
                     /gene="LOC111072393"
                     /note="Beta2-adaptin appendage, C-terminal sub-domain;
                     Region: B2-adapt-app_C; smart01020"
                     /db_xref="CDD:198088"
ORIGIN      
        1 ctgaaggtga ggcggtattt tataaatccg cggtcactct aattaatttt ttgtgcccga
       61 aaaaacgaat tttacagaaa gtcctagcta gttcgtagag cagaactgac aagatgaccg
      121 attcaaagta tttcacaacc accaaaaagg gcgaaatctt cgagctcaag tccgagctga
      181 acaatgacaa gaaggagaag aagaaggagg ctgtgaagaa ggtgattgcc agcatgaccg
      241 tcggcaaaga tgtgtccgcc ctctttcccg atgtcgtgaa ctgcatgcag accgataatc
      301 tggagctcaa gaagctggtc tacttgtatc tgatgaacta cgccaagtcg cagccggaca
      361 tggccatcat ggcggtgaat acattcgtga aggactgcga ggactccaat ccattgatcc
      421 gtgccctggc cgtgcgtacc atgggctgca taagagtgga taagataacc gagtatctgt
      481 gcgagccgct gcgcaagtgt ctgaaggatg aggatcccta tgtgcgcaaa acggcggctg
      541 tgtgcgtggc gaagctgtac gacatatcgg ccaccatggt ggaggaccag ggctttctcg
      601 atcagctgaa ggacctgctg tccgactcca atccgatggt cgtggccaat gcggtggctg
      661 ccctcagcga aatcaacgag gccagccagt cgggacagcc gctggtagag atgaactcgg
      721 tgaccatcaa caagctgctg acggccctca acgagtgcac agagtgggga caggtcttca
      781 tccttgactc cctggccaac tacagcccca aagatgagcg ggaggcgcag tcaatctgtg
      841 agcgaatcac gcctcgttta gcccatgcga acgctgccgt ggttctcagt gccgtcaagg
      901 tgctgatgaa acttctcgag atgctctcca gtgacagcga cttttgtgcc acgctcacca
      961 agaagctggc cccgcccctg gtgaccctgc tttcctcgga gccagaggta caatatgtgg
     1021 ccctgcgcaa cattaatctt attgtccaga agcgtcccga catcctcaaa catgagatga
     1081 aggtgttctt tgtgaagtac aacgatccca tctacgtgaa gttggagaaa ttggacatta
     1141 tgatccgtct ggccaaccag agcaacattg cccaggtgct cagcgaactg aaggagtacg
     1201 ccaccgaagt ggatgtcgat tttgtgcgga aggcagtgcg cgccatcggt cgttgtgcca
     1261 tcaaagtgga gccatcggca gagcgctgtg tctccactct gctcgatctc atccagacca
     1321 aggtcaatta tgtggtgcag gaggcaattg ttgtcattaa agacatcttc cgcaagtatc
     1381 ccaataagta cgagagcatt atcagcacct tgtgcgagaa tctggacacc ctggatgagc
     1441 cggaggcgcg tgcctcgatg gtctggatca ttggcgagta cgccgagcgc attgataacg
     1501 cagacgagct gctcgacagc ttccttgagg gcttccagga tgagaatgcc caagtgcagc
     1561 tgcagttgct cactgctgtg gtgaagctct tccttaagcg tccatcggat acccaagagc
     1621 tcgtgcagca cgtcctctcg ctggccactc aggattcgga caatcccgat ttgcgcgacc
     1681 gtggattcat ctactggcgt ctactctcca cggacccggc cgccgccaag gaagttgtgt
     1741 tggcggacaa gcctctcatc tcggaggaaa cggatctgct ggagccgacg ctgctggacg
     1801 agctcatctg tcacatcagc tcgctggcca gcgtgtacca caagccacca acggcctttg
     1861 tggagggacg aggagctggc gtgcgtaagt ctctgccaaa ccgcactgcc ggaaccggcg
     1921 tgagcagcgg tgcaggagat cagcaagaga cgggagccgg ttcggaggct atggtcatac
     1981 ccaaccaaga atcgcttatt ggggatttgc tgtccatgga catcaatgcc ccctctatgc
     2041 ccgctgcccc aaccgccaca agcaacgtgg atctgctagg cggtggcctg gacatactgc
     2101 tgggtggccc accagctgaa ccagcaccgg gcggcgcctc cagcctgctg ggcgacatct
     2161 ttggcctggc cggcacctcc ctttctgtgg gcgttcaaat tccgaaagtc acgtggctgc
     2221 cagcggagaa gggcaagggc ctggagatcc agggcacctt ctcccgccgc aacggtgaag
     2281 tcttcatgga catgacgctc accaacaaag ccatgcagcc gatgacgaac tttgccatcc
     2341 agctgaacaa gaacagcttt ggcctgtcgc cagcctcacc gctggcggcg gtgcccttgc
     2401 cacccaacca gacggccgag gtgagcctcg ccctgggcac caacggaccc atccagcgca
     2461 tggagccgct gaacaacctt caggtggcgg tgaagaacaa cattgacatc ttctatttcg
     2521 cctgcctggt gcacggcaac gtgctgttcg ctgaggacgg ccagctggac aagcgggtct
     2581 tcctgaacac ctggaaggag ataccggccg ccaacgagct gcagtacagc ctgagcggcg
     2641 tcatcggaac cactgacggc atcgcctcca agatgaccac caacaacatc ttcaccattg
     2701 ccaagcgcaa tgtcgagggc caagacatgc tctatcagtc gctgaggctg acgaacaaca
     2761 tctgggtgtt gctggaacta aagctgcagc cgggcaaccc tgatgccacg ctcagcctca
     2821 agtcacgatc cgtggaggtg gccaatatca ttttcgccgc ctacgaggcc atcattcgct
     2881 cgccttaaac tccaaacaca aatcgaaata agatacccat gagccacaga atcgtttctt
     2941 aatgttttct gtaggtgtta taccttatag cagatacaac aagcaaattg tagtctacgt
     3001 actatattat aactactatt attgcattgt gcgtatattg ggagttgcga attgttccat
     3061 gcacctacat atatacctat atacaaaaca ttaatacgtg catacataca cacaccatat
     3121 gtaatactaa tcctaatgaa taacgcgaga agaagaaatg ttaattgtta ttaaacgttg
     3181 catgctccgt agaaatccaa ttcaatcgat gccggagcat cggatgttag tcgcattcca
     3241 aaatctataa tataaccgcc cccaatgcat gcatctatgt atatgtatgt atgtgtgtcc
     3301 tagtaaaaat gtatgacata taacgcacta aataatcgaa acattga