PREDICTED: Drosophila obscura cell wall protein DAN4


LOCUS       XM_041591947            1743 bp    mRNA    linear   INV 14-MAY-2021
            (LOC111070724), mRNA.
ACCESSION   XM_041591947
VERSION     XM_041591947.1
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..1743
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..1743
                     /gene="LOC111070724"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 3 Proteins, and 97% coverage of
                     the annotated genomic feature by RNAseq alignments"
                     /db_xref="GeneID:111070724"
     CDS             9..1694
                     /gene="LOC111070724"
                     /codon_start=1
                     /product="cell wall protein DAN4"
                     /protein_id="XP_041447881.1"
                     /db_xref="GeneID:111070724"
                     /translation="MMFAIACFALVLPALTLSQGYSEGYFPSRQYHHEPTVDQQYDYG
                     SCGGRVCASNGYRYANFANICRLNDYNLRLVFAGHAEFVEVDPIYCHQPPRDVGYYYR
                     PQPAPESHRPGYSPHVPCIPMTRPHIGPQHIAQSASAFAFSGYSSPAIPFWFYKPAMS
                     PTRPPADSKIYWYQAPHTSKRPVTYYYPTTSTESSTTSTTNDPSTTTTESSTTSTTND
                     PSTTTSSESSTTSTTNDPSTTTTESSTTSTTNDPSTTSESSTTTNLPSTSTTNDPSTT
                     TATTEFSTTSTTNDPSTTTSSESSTTSTTNDPSTTTTESSTTSTTNDPSTTSESSTTS
                     TTNDPSTTTNSESSTTSTTNDPSTTTATTEFSTTSTTNDPSTTTTSESSMTSTTNDPS
                     TTTNSESSTTSTTNDPSTTSESSTTSTTNDPSTTATSESSTTSTTNDPSTTTTTESST
                     MSTTNDPSTTATSESSTTTNTNVRSAVLRTELNSAVDPVTIQITGPNGKSVRLVLSDL
                     EAGGSTCTDAYTLDVTRGSTVLFQFTGCADANTAPWIKPSYLFYHTSTSVVQT"
ORIGIN      
        1 cattcagaat gatgtttgcc attgcctgct ttgccttggt gctgccagca ctgaccctct
       61 cacagggcta ctcggagggg tattttccga gcagacaata ccatcacgag ccaacagtcg
      121 accagcagta cgactacgga tcctgcgggg gccgtgtttg cgcctccaat gggtatcgct
      181 acgccaactt cgccaatatc tgccgcctga acgactacaa tttgaggctt gtgtttgctg
      241 gccatgcaga atttgtcgaa gtggatccga tatactgcca tcagccccca agagatgtgg
      301 gatactacta cagaccgcaa ccagcacccg aatcgcaccg accaggctat tcgccgcacg
      361 tgccctgcat tcccatgacc cggccccaca tcggacccca acacatcgct cagtcagcaa
      421 gtgcttttgc tttcagtgga tattcttcgc ctgctattcc gttctggttt tacaagcctg
      481 cgatgtctcc cacaaggccc ccagctgaca gcaaaattta ttggtatcag gcgccccata
      541 cgagcaagcg acctgtaacc tactattacc caacaacatc caccgaatct tcaacgacga
      601 gtaccaccaa cgacccttca acaacaacca ccgaatcttc aacgacgagt accaccaatg
      661 acccttcaac aacaacaagc agcgaatctt ctacgacgag taccaccaat gacccttcaa
      721 caacaaccac cgaatcttca acgacgagta ccaccaacga cccttcaaca accagcgaat
      781 cttctacgac gacgaatctt ccatcaacga gtaccaccaa tgacccttca acaacaacag
      841 caaccaccga attttcaacg acgagtacca ccaatgaccc ttcaacaaca acaagcagcg
      901 aatcttctac gacgagtacc accaatgacc cttcaacaac aaccaccgaa tcttcaacga
      961 cgagtaccac caacgaccct tcaacaacca gcgaatcttc tacgacgagt accaccaatg
     1021 acccttcaac aacaacaaac agcgaatctt ccacgacgag taccaccaat gacccttcaa
     1081 caacaacagc aaccaccgaa ttttcaacga cgagtaccac caatgaccct tcaacaacaa
     1141 caaccagcga atcttctatg acaagtacca ccaatgaccc ttcaacaaca acaaacagcg
     1201 aatcttctac gacgagtacc accaatgacc cttcaacaac cagcgaatct tctacgacga
     1261 gtaccaccaa tgacccttca acaacagcaa ccagcgaatc ttctacgacg agtaccacca
     1321 atgacccttc aacaacaaca accaccgaat cttcaacgat gagtaccacc aatgaccctt
     1381 caacaacagc aaccagcgaa tcttctacga cgactaacac aaatgttcgc tctgcggttt
     1441 tacgcacaga actcaactct gctgtggatc cggttaccat acagatcaca ggtccgaacg
     1501 ggaaatccgt gcgcctcgtc ctctccgacc tggaagctgg aggaagcaca tgcactgatg
     1561 cgtacaccct ggacgtgacc aggggatcga cggtgttatt tcagtttact ggttgcgcgg
     1621 atgcaaacac agccccgtgg atcaagccgt catacctttt ctaccataca tccaccagcg
     1681 ttgtccaaac ctgatgacgc tcattcacaa atactccgaa aaatctatta ctgaacaata
     1741 aat