PREDICTED: Drosophila obscura AP-1 complex subunit beta-1


LOCUS       XM_022364237            3371 bp    mRNA    linear   INV 14-MAY-2021
DEFINITION  PREDICTED: Drosophila obscura AP-1 complex subunit beta-1
            (LOC111072393), transcript variant X2, mRNA.
ACCESSION   XM_022364237
VERSION     XM_022364237.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022364237.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..3371
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..3371
                     /gene="LOC111072393"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 4 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 15 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111072393"
     CDS             138..2912
                     /gene="LOC111072393"
                     /codon_start=1
                     /product="AP-1 complex subunit beta-1"
                     /protein_id="XP_022219929.1"
                     /db_xref="GeneID:111072393"
                     /translation="MTDSKYFTTTKKGEIFELKSELNNDKKEKKKEAVKKVIASMTVG
                     KDVSALFPDVVNCMQTDNLELKKLVYLYLMNYAKSQPDMAIMAVNTFVKDCEDSNPLI
                     RALAVRTMGCIRVDKITEYLCEPLRKCLKDEDPYVRKTAAVCVAKLYDISATMVEDQG
                     FLDQLKDLLSDSNPMVVANAVAALSEINEASQSGQPLVEMNSVTINKLLTALNECTEW
                     GQVFILDSLANYSPKDEREAQSICERITPRLAHANAAVVLSAVKVLMKLLEMLSSDSD
                     FCATLTKKLAPPLVTLLSSEPEVQYVALRNINLIVQKRPDILKHEMKVFFVKYNDPIY
                     VKLEKLDIMIRLANQSNIAQVLSELKEYATEVDVDFVRKAVRAIGRCAIKVEPSAERC
                     VSTLLDLIQTKVNYVVQEAIVVIKDIFRKYPNKYESIISTLCENLDTLDEPEARASMV
                     WIIGEYAERIDNADELLDSFLEGFQDENAQVQLQLLTAVVKLFLKRPSDTQELVQHVL
                     SLATQDSDNPDLRDRGFIYWRLLSTDPAAAKEVVLADKPLISEETDLLEPTLLDELIC
                     HISSLASVYHKPPTAFVEGRGAGVRKSLPNRTAGTGVSSGAGDQQETGAGSEAMVIPN
                     QESLIGDLLSMDINAPSMPAAPTATSNVDLLGGGLDILLGGPPAEPAPGGASSLLGDI
                     FGLAGTSLSVGVQIPKVTWLPAEKGKGLEIQGTFSRRNGEVFMDMTLTNKAMQPMTNF
                     AIQLNKNSFGLSPASPLAAVPLPPNQTAEVSLALGTNGPIQRMEPLNNLQVAVKNNID
                     IFYFACLVHGNVLFAEDGQLDKRVFLNTWKEIPAANELQYSLSGVIGTTDGIASKMTT
                     NNIFTIAKRNVEGQDMLYQSLRLTNNIWVLLELKLQPGNPDATLSLKSRSVEVANIIF
                     AAYEAIIRSP"
     misc_feature    249..1742
                     /gene="LOC111072393"
                     /note="Adaptin N terminal region; Region: Adaptin_N;
                     pfam01602"
                     /db_xref="CDD:396262"
     misc_feature    288..362
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    order(336..341,348..350,357..362,447..452,459..461,
                     468..473,552..557,564..566,573..578,585..587,669..674,
                     681..683,690..695,798..803,810..812,819..824)
                     /gene="LOC111072393"
                     /note="putative peptide binding site [polypeptide
                     binding]; other site"
                     /db_xref="CDD:293787"
     misc_feature    396..479
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    498..590
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    615..695
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    726..824
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    1314..1388
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    1422..1511
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    1530..1622
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    1653..1763
                     /gene="LOC111072393"
                     /note="HEAT repeat [structural motif]; Region: HEAT
                     repeat"
                     /db_xref="CDD:293787"
     misc_feature    2253..2543
                     /gene="LOC111072393"
                     /note="Adaptin C-terminal domain; Region: Alpha_adaptinC2;
                     smart00809"
                     /db_xref="CDD:197886"
     misc_feature    2571..2903
                     /gene="LOC111072393"
                     /note="Beta2-adaptin appendage, C-terminal sub-domain;
                     Region: B2-adapt-app_C; smart01020"
                     /db_xref="CDD:198088"
ORIGIN      
        1 acttacatgt ggacgtgtta aacggggttt atgttgactt tgaaaatttg aatttgtatt
       61 tgagacgtgt tcaagctctg tatctgtttg tgcgtcttct gaaagtccta gctagttcgt
      121 agagcagaac tgacaagatg accgattcaa agtatttcac aaccaccaaa aagggcgaaa
      181 tcttcgagct caagtccgag ctgaacaatg acaagaagga gaagaagaag gaggctgtga
      241 agaaggtgat tgccagcatg accgtcggca aagatgtgtc cgccctcttt cccgatgtcg
      301 tgaactgcat gcagaccgat aatctggagc tcaagaagct ggtctacttg tatctgatga
      361 actacgccaa gtcgcagccg gacatggcca tcatggcggt gaatacattc gtgaaggact
      421 gcgaggactc caatccattg atccgtgccc tggccgtgcg taccatgggc tgcataagag
      481 tggataagat aaccgagtat ctgtgcgagc cgctgcgcaa gtgtctgaag gatgaggatc
      541 cctatgtgcg caaaacggcg gctgtgtgcg tggcgaagct gtacgacata tcggccacca
      601 tggtggagga ccagggcttt ctcgatcagc tgaaggacct gctgtccgac tccaatccga
      661 tggtcgtggc caatgcggtg gctgccctca gcgaaatcaa cgaggccagc cagtcgggac
      721 agccgctggt agagatgaac tcggtgacca tcaacaagct gctgacggcc ctcaacgagt
      781 gcacagagtg gggacaggtc ttcatccttg actccctggc caactacagc cccaaagatg
      841 agcgggaggc gcagtcaatc tgtgagcgaa tcacgcctcg tttagcccat gcgaacgctg
      901 ccgtggttct cagtgccgtc aaggtgctga tgaaacttct cgagatgctc tccagtgaca
      961 gcgacttttg tgccacgctc accaagaagc tggccccgcc cctggtgacc ctgctttcct
     1021 cggagccaga ggtacaatat gtggccctgc gcaacattaa tcttattgtc cagaagcgtc
     1081 ccgacatcct caaacatgag atgaaggtgt tctttgtgaa gtacaacgat cccatctacg
     1141 tgaagttgga gaaattggac attatgatcc gtctggccaa ccagagcaac attgcccagg
     1201 tgctcagcga actgaaggag tacgccaccg aagtggatgt cgattttgtg cggaaggcag
     1261 tgcgcgccat cggtcgttgt gccatcaaag tggagccatc ggcagagcgc tgtgtctcca
     1321 ctctgctcga tctcatccag accaaggtca attatgtggt gcaggaggca attgttgtca
     1381 ttaaagacat cttccgcaag tatcccaata agtacgagag cattatcagc accttgtgcg
     1441 agaatctgga caccctggat gagccggagg cgcgtgcctc gatggtctgg atcattggcg
     1501 agtacgccga gcgcattgat aacgcagacg agctgctcga cagcttcctt gagggcttcc
     1561 aggatgagaa tgcccaagtg cagctgcagt tgctcactgc tgtggtgaag ctcttcctta
     1621 agcgtccatc ggatacccaa gagctcgtgc agcacgtcct ctcgctggcc actcaggatt
     1681 cggacaatcc cgatttgcgc gaccgtggat tcatctactg gcgtctactc tccacggacc
     1741 cggccgccgc caaggaagtt gtgttggcgg acaagcctct catctcggag gaaacggatc
     1801 tgctggagcc gacgctgctg gacgagctca tctgtcacat cagctcgctg gccagcgtgt
     1861 accacaagcc accaacggcc tttgtggagg gacgaggagc tggcgtgcgt aagtctctgc
     1921 caaaccgcac tgccggaacc ggcgtgagca gcggtgcagg agatcagcaa gagacgggag
     1981 ccggttcgga ggctatggtc atacccaacc aagaatcgct tattggggat ttgctgtcca
     2041 tggacatcaa tgccccctct atgcccgctg ccccaaccgc cacaagcaac gtggatctgc
     2101 taggcggtgg cctggacata ctgctgggtg gcccaccagc tgaaccagca ccgggcggcg
     2161 cctccagcct gctgggcgac atctttggcc tggccggcac ctccctttct gtgggcgttc
     2221 aaattccgaa agtcacgtgg ctgccagcgg agaagggcaa gggcctggag atccagggca
     2281 ccttctcccg ccgcaacggt gaagtcttca tggacatgac gctcaccaac aaagccatgc
     2341 agccgatgac gaactttgcc atccagctga acaagaacag ctttggcctg tcgccagcct
     2401 caccgctggc ggcggtgccc ttgccaccca accagacggc cgaggtgagc ctcgccctgg
     2461 gcaccaacgg acccatccag cgcatggagc cgctgaacaa ccttcaggtg gcggtgaaga
     2521 acaacattga catcttctat ttcgcctgcc tggtgcacgg caacgtgctg ttcgctgagg
     2581 acggccagct ggacaagcgg gtcttcctga acacctggaa ggagataccg gccgccaacg
     2641 agctgcagta cagcctgagc ggcgtcatcg gaaccactga cggcatcgcc tccaagatga
     2701 ccaccaacaa catcttcacc attgccaagc gcaatgtcga gggccaagac atgctctatc
     2761 agtcgctgag gctgacgaac aacatctggg tgttgctgga actaaagctg cagccgggca
     2821 accctgatgc cacgctcagc ctcaagtcac gatccgtgga ggtggccaat atcattttcg
     2881 ccgcctacga ggccatcatt cgctcgcctt aaactccaaa cacaaatcga aataagatac
     2941 ccatgagcca cagaatcgtt tcttaatgtt ttctgtaggt gttatacctt atagcagata
     3001 caacaagcaa attgtagtct acgtactata ttataactac tattattgca ttgtgcgtat
     3061 attgggagtt gcgaattgtt ccatgcacct acatatatac ctatatacaa aacattaata
     3121 cgtgcataca tacacacacc atatgtaata ctaatcctaa tgaataacgc gagaagaaga
     3181 aatgttaatt gttattaaac gttgcatgct ccgtagaaat ccaattcaat cgatgccgga
     3241 gcatcggatg ttagtcgcat tccaaaatct ataatataac cgcccccaat gcatgcatct
     3301 atgtatatgt atgtatgtgt gtcctagtaa aaatgtatga catataacgc actaaataat
     3361 cgaaacattg a