PREDICTED: Drosophila obscura uncharacterized LOC111072424


LOCUS       XM_022364275            3242 bp    mRNA    linear   INV 14-MAY-2021
DEFINITION  PREDICTED: Drosophila obscura uncharacterized LOC111072424
            (LOC111072424), mRNA.
ACCESSION   XM_022364275
VERSION     XM_022364275.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022364275.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..3242
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..3242
                     /gene="LOC111072424"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 2 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 14 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111072424"
     CDS             226..3108
                     /gene="LOC111072424"
                     /codon_start=1
                     /product="uncharacterized protein LOC111072424"
                     /protein_id="XP_022219967.2"
                     /db_xref="GeneID:111072424"
                     /translation="MFLAVNQSLHNASKKKKKRRSIQQDEDETGSSSTANSSEAKPPR
                     RLESAASSDQLVGDRAASGGANKAVTSLVLVYIYLGALTLILASLAIVFYTHTQQDSD
                     AAPTQSNSRLFRAQFQAELQRSEDVLRAMLSRIAEADHERETGTASTTRKMARGSGEV
                     KNERKFTDNLIDGHAPRATEEQRMRMRIRRDVVSSPASMHALAADPLIEFFNPNHRMA
                     LEEQDTEIRKRTGQKGAAPGGDEWIYLNTYCRVPEKIITGFCKGTQDYCPPAPVGPPG
                     ESGPKGLTGNPGLPGIPGPKGNRGDVGLPGAPGVDGVGHVGPAGPRGPKGDAGGVGRS
                     GLDGRDGVPGEPGLDGVPGRAGADGKNGQSGRDGKDGLHGKDGKDGLSITGPKGAQGP
                     PGERGLKGIAGPRGRPGKPGTNGTPGVPGINAWKMQFPNGSSSNDLLIPPSITDLHAP
                     DFHRTVIVEEGRSLNLSCTATGSPQPQVEWRREDGRTINVNGMEMASISGQFLKFTNI
                     TRHQMAAYTCYANNGIAPVANATFIVEVHFAPMISVYRQMIYAEYQSTATLECLVEAF
                     PEAIRYWERAYDGKILDPSEKYSIESYPDGFKTSMRLTVNNLRKDDFGYYHCVARNEL
                     NATMVNFEIAPQDPNSETPYVGNSIKVYGQRPPESECPVCDQCPDPSLYQCKDSILNN
                     FEIQPTGNLSYPGLPKRPKTCYLYAVGKPVFHKVVNEKFGAWLRDPAPESDREKTFVT
                     NENDPYNLFEFTTRIQYRMNSVPRRKYEIPEGFHGNAHVVFNGSFYYHQRNSDLVVKL
                     DLTSLKKITTQLPYAGVAASNRLYATDFNFMDFNVDEVGLWVIYSTYNSNNTLVAKLD
                     AETLKMQYNFNITLDHHQFGEMFIVCGNLYAIDSATDKNTQIRYVVDLYKGKLLNTNL
                     PFSNPFSHTTTVGYNPLTVELYSWDKGNALTYPIRYNEQRLISDNS"
     misc_feature    <1027..>1485
                     /gene="LOC111072424"
                     /note="LPXTG-anchored collagen-like adhesin Scl2/SclB;
                     Region: gly_rich_SclB; NF038329"
                     /db_xref="CDD:468478"
     misc_feature    1588..1833
                     /gene="LOC111072424"
                     /note="Immunoglobulin domain; Region: Ig; cl11960"
                     /db_xref="CDD:472250"
     misc_feature    1615..1629
                     /gene="LOC111072424"
                     /note="Ig strand B [structural motif]; Region: Ig strand
                     B"
                     /db_xref="CDD:409562"
     misc_feature    1654..1668
                     /gene="LOC111072424"
                     /note="Ig strand C [structural motif]; Region: Ig strand
                     C"
                     /db_xref="CDD:409562"
     misc_feature    1726..1740
                     /gene="LOC111072424"
                     /note="Ig strand E [structural motif]; Region: Ig strand
                     E"
                     /db_xref="CDD:409562"
     misc_feature    1768..1785
                     /gene="LOC111072424"
                     /note="Ig strand F [structural motif]; Region: Ig strand
                     F"
                     /db_xref="CDD:409562"
     misc_feature    1810..1821
                     /gene="LOC111072424"
                     /note="Ig strand G [structural motif]; Region: Ig strand
                     G"
                     /db_xref="CDD:409562"
     misc_feature    1843..2091
                     /gene="LOC111072424"
                     /note="Immunoglobulin domain; Region: Ig_3; pfam13927"
                     /db_xref="CDD:464046"
     misc_feature    2338..3075
                     /gene="LOC111072424"
                     /note="Olfactomedin-like domain; Region: OLF; pfam02191"
                     /db_xref="CDD:460482"
ORIGIN      
        1 gccaacgcgt ttggtcacca gctctctctc tctctctcac tctctttctc tgtcttttct
       61 tcaatatctt tctcccattc acacttacgc tctcacattc acgctctctc cgcgcctccc
      121 atttgtcgct gccccatgcg gaaaagtgtg aaaaagtttt agtagcaagc agcggctcgg
      181 ctcttatgta tacaccagcc gcacggacac cacagcggct gcaacatgtt cttggccgtc
      241 aaccagagtc tgcacaatgc cagcaagaag aagaagaagc gacgctccat tcagcaggat
      301 gaggacgaga ccggctcgtc cagcacagcc aacagcagtg aggcgaagcc accgcggcgc
      361 ctggagtcag cggcctccag tgaccaactg gtgggggaca gggccgcgtc tggcggtgcc
      421 aacaaggcgg ttacctccct ggtgctcgtc tacatctatt tgggtgccct caccctgatc
      481 ctggccagcc tggccatcgt cttttacacg cacacacagc aggatagcga cgcggcgcca
      541 acgcagagca actcgaggct ctttcgcgca cagttccagg cggagttgca gcgatccgag
      601 gatgtcctgc gagcgatgct cagccggata gccgaagcgg atcatgagcg ggaaacgggc
      661 accgccagca ccacgcgaaa gatggccaga ggcagcggcg aggtgaagaa cgagcgcaag
      721 ttcacggaca acctgatcga tgggcacgcc ccgcgtgcga cggaggagca gcgaatgcga
      781 atgcggatac ggcgggacgt tgtctcgtcg ccggcctcga tgcacgcact tgcagctgat
      841 ccactgatcg agttcttcaa tccgaaccac cgcatggcgc tcgaggagca ggacactgag
      901 atccgcaagc ggacaggcca gaagggtgcc gcgcccggcg gcgacgagtg gatctatctg
      961 aacacctact gccgcgtgcc cgagaagatt atcacgggct tctgcaaggg cacccaggac
     1021 tactgtccgc cggcgccggt gggcccgccg ggcgagtccg gccccaaggg cctaaccggc
     1081 aatcccggcc tgcccggcat acccggcccc aagggcaatc gcggcgatgt cggcctgccc
     1141 ggcgcacccg gcgtcgatgg tgtcggccat gtggggccgg ctggtccgcg tgggcccaag
     1201 ggcgatgcgg gcggcgtcgg acggtcgggc ctggacgggc gcgacggtgt gcccggcgag
     1261 ccgggcctgg atggcgtacc ggggcgagcg ggcgccgatg gcaagaacgg gcagtcggga
     1321 cgcgacggca aggatgggct gcatggcaag gacggcaagg atgggctgtc cataacgggg
     1381 ccgaagggcg cccagggccc gcccggcgaa cgtggactca agggcattgc gggtccgcgc
     1441 ggtcgtcccg gcaagccggg caccaacggc acgcccggcg tgcccggcat caatgcatgg
     1501 aagatgcagt tccccaatgg cagctcctcg aacgatctgc tgataccgcc ctcgatcacg
     1561 gatctgcatg cgccggactt ccatcgcacg gtgattgtcg aggagggtcg atccctgaat
     1621 ctcagctgca cggccaccgg cagtccccag ccgcaggtgg agtggcgccg cgaggacggc
     1681 cgcaccatca acgtcaatgg catggagatg gcctccatca gcggacagtt tctgaagttc
     1741 accaacatca cgcggcacca gatggcggcc tacacgtgct acgccaacaa tgggattgca
     1801 cccgtcgcca atgcgacctt cattgtggaa gttcactttg ctcccatgat ctcggtgtac
     1861 cgacaaatga tctacgcgga gtaccagagc acggccacgc tggagtgcct ggtggaggcc
     1921 ttccccgagg ccatacgcta ctgggagcgg gcctacgatg gcaagatact ggatcccagc
     1981 gagaagtaca gcattgaatc gtatccagat ggtttcaaaa cttcgatgcg gctgaccgtt
     2041 aataatctgc gcaaggacga ctttggctac taccactgtg tggcacgcaa cgagctgaat
     2101 gccaccatgg tcaactttga gatagcgcca caagatccga acagtgagac gccctatgtg
     2161 ggcaacagca tcaaggtgta tggccagcga ccgccggaga gcgagtgtcc cgtctgtgat
     2221 cagtgtccgg acccaagcct gtaccagtgc aaggattcca tactgaacaa ctttgagatc
     2281 cagccgacag gcaatctcag ctatccgggg ctgcccaagc gacccaagac ctgctatctg
     2341 tatgcggtgg gcaagcccgt gttccacaag gtcgttaacg agaagtttgg cgcctggctg
     2401 cgcgacccgg cgcccgagag cgatcgggag aagacgttcg tcacgaacga gaatgatccg
     2461 tacaatctgt ttgagttcac cacgcggata cagtaccgca tgaacagtgt gcccaggcgc
     2521 aagtacgaga tacccgaggg ctttcatggc aacgctcatg tggtgttcaa tggctcgttc
     2581 tactatcacc agcggaactc cgatctggtg gttaaactgg atctgacaag cctcaagaaa
     2641 atcaccacac aattgccgta cgcgggcgtg gcagcctcca accgactcta cgcaacggac
     2701 ttcaatttta tggacttcaa tgtggacgag gtgggtctgt gggtcatcta cagcacctac
     2761 aactccaaca acacgctggt ggcaaagttg gatgcggaga ccctgaagat gcagtacaac
     2821 tttaatatca cactggacca tcatcagttc ggggagatgt tcattgtgtg cggcaatctg
     2881 tatgccatcg attcggccac cgataagaat acgcagatcc gatatgtcgt cgatctgtac
     2941 aagggcaagc tgctcaatac gaatctgccg ttctcgaatc ccttcagcca caccaccacc
     3001 gttggctaca atcccctcac agtggaactc tactcgtggg acaagggcaa cgccctcaca
     3061 tatcccatac gctacaatga gcagcgcctc atctccgaca acagctagga gcgagagcca
     3121 tagatcactt aactaccata tgcccgggct cccaagggat ctggccacag ctcaaatcta
     3181 atatagattc taaggcacac aaacacaaac aataaataaa tgagaattgt ttttttttcc
     3241 aa