PREDICTED: Drosophila obscura homeobox protein vnd (LOC111066351),


LOCUS       XM_022354877            3014 bp    mRNA    linear   INV 14-MAY-2021
            mRNA.
ACCESSION   XM_022354877
VERSION     XM_022354877.2
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            On May 14, 2021 this sequence version replaced XM_022354877.1.
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..3014
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..3014
                     /gene="LOC111066351"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Gnomon. Supporting evidence
                     includes similarity to: 2 Proteins, and 100% coverage of
                     the annotated genomic feature by RNAseq alignments,
                     including 10 samples with support for all annotated
                     introns"
                     /db_xref="GeneID:111066351"
     CDS             897..2696
                     /gene="LOC111066351"
                     /codon_start=1
                     /product="homeobox protein vnd"
                     /protein_id="XP_022210569.2"
                     /db_xref="GeneID:111066351"
                     /translation="MSNYNPNCGYFEDCSYYTNNVYQQDYCMQPDYEYNKHVYDLFDA
                     KVPSSQRSGFHISDILNLDGSDLKNAAAAAAAAAAAQHSSELSHAAEASNGHGPATLS
                     PTPTSAAALEEHGAGSGHGEHHTTEHHPQQPHHPPQHPHHHQPHPQHHQQQHPHPHPN
                     PHPQHHQQTIAPPLPLSHHQSSAAAAAAAAASAGVASDHHVGAHAHAAAHLLASHNAA
                     AAAAVAAGQYLPKNFAGTFGDEMSSYHHMAQTMLQHSGRSAWIKENELYGTQQPASPD
                     STSPVTSEVSYTYIGSNCQTSPALSGDYKNYSRSADSDALSVGDAMHSIHGGANSGGP
                     SAAHALHNNNNNNNNNSTSNNNNNNHSLKHDHPINGAGGGGGGASSGHDDSLNEDGIE
                     EDIDDVDDADGSGGGGSGGLNSDGLPNKKRKRRVLFTKAQTYELERRFRQQRYLSAPE
                     REHLASLIRLTPTQVKIWFQNHRYKTKRAQNEKGYEHPGLLHGHATHPHHPSALPSPR
                     RVAVPVLVRNGKPCLGDGSKLAPDCVSVSSATATAMQNAAAAHHLVALNGAAYQHAAA
                     AAAAGLHAHAHAHAQAHAHVHPHAHAQRAAWWP"
     misc_feature    2160..2330
                     /gene="LOC111066351"
                     /note="Region: Homeodomain; pfam00046"
                     /db_xref="CDD:459649"
ORIGIN      
        1 agctgtccca gtcccagtcc cacttcccag ttcttcgtcc gtgtgtgtgt atgtggatca
       61 tcgtgcagca agagcttctg gcctcagggg tcccttcatt ggcagtacga cattgtcagt
      121 gggtaccatt cgacgtggaa cgcatcgaat gccgatcgcc agcttcgtgt cgcgtcgcgt
      181 ttgccagagc gagagctttc acagccatcg agtgagtgcc agagcgggaa agcgagagcg
      241 catgcgcatc tgcatctgca ttggtcatag taacggacag gcgaacaggc ggacactcag
      301 acagcggaca gcagacagcg gaaagcggac agattgtttt agctgattgc gagtggcagc
      361 gtttttatgg cttattgaaa tcggcaaacg gcagtcaaaa agcgcgcgct ccgcagccca
      421 caactcggag agaccacctc ccactcgaga ccgtaaactg ttaaccgtaa accatcgacc
      481 gtaaatccag actctttcgg caccgataga gttggcaaaa atgtagctct cgatcgaagt
      541 gcaattgaat aataaatcaa agttcgcgcc acagcttaat ggttgtacga gtacacacaa
      601 attataaagt gatcgtgcat taaaaaccga tcgacaacca catacaatac gtgcatatgt
      661 ataggccact ccaggcacat cagcatttac ccccaagccc ccacatcggc tgtcatcgcg
      721 aagtgcaaat aattaaccgt cgcgagctta caaaattaat tcattaaatg tgccactgac
      781 tacacaattt ttttgcaatt attttatcgt ttctgtttcc tttcggctga gttttggttt
      841 tgttccgatt atcctcctgg cggcaggcag cacgcgagag ccccctaaca ataattatga
      901 gcaattataa tccgaattgc ggttacttcg aggattgcag ctactacacg aacaatgtgt
      961 accaacagga ttattgcatg cagccggatt acgagtacaa caagcatgta tacgatttgt
     1021 ttgatgccaa agtgccgtcg tcgcagcgct ccggcttcca tatatcggac atcctcaacc
     1081 tggatggctc cgatctgaag aatgccgccg ccgctgctgc tgccgctgct gctgcccagc
     1141 acagcagcga gctgagccac gcggcggaag ccagcaatgg ccatggccca gcaacgctct
     1201 cgccgacgcc caccagtgcg gcggcgctgg aggagcatgg cgctgggtcc ggacacggcg
     1261 agcaccacac cacagagcac catccccagc agccgcacca cccgccgcag catccgcatc
     1321 accatcagcc gcatccccag caccaccagc aacagcatcc gcatccgcat ccgaatccgc
     1381 atccgcagca ccaccagcaa acgatagccc cacccttgcc actgtcgcac caccagagca
     1441 gtgcggctgc tgctgctgct gccgccgcca gtgcgggagt tgcatccgat caccacgtgg
     1501 gcgcccacgc ccatgccgcc gcccacctgc tggccagtca caatgcggcg gccgccgctg
     1561 ccgttgccgc cgggcagtat ctgcccaaga atttcgcagg caccttcggg gacgagatgt
     1621 cctcctacca ccacatggcc cagacaatgc tccaacactc gggacgtagc gcgtggatca
     1681 aagaaaacga attatacggc acacagcagc cggccagtcc tgatagcacc tcgccggtca
     1741 catcggaggt ctcctacacg tacatcggct ccaattgcca aacctcgccc gccctctccg
     1801 gcgactacaa gaactacagt cggtcggcgg acagtgatgc cctctcggtg ggcgatgcca
     1861 tgcacagcat ccatggcggt gccaattctg gtggaccctc ggcggcacat gccctacaca
     1921 acaacaataa caacaacaac aacaatagca ccagcaacaa caacaacaac aatcacagcc
     1981 tgaaacacga tcaccccatc aatggagctg gtggcggagg cggaggagca agcagcgggc
     2041 acgatgacag cctcaacgag gatggcatcg aggaggacat cgacgatgtg gacgatgcgg
     2101 atggcagcgg tggcggcggc agtggcggcc tcaatagcga cggactgccc aacaagaagc
     2161 gcaagcgccg cgtgctcttc accaaggcgc agacctacga gctggagcga cgattccgac
     2221 agcagcgata cctgagcgca ccggagcgcg agcatctggc cagcctcatt cgtctgacgc
     2281 cgacgcaggt gaagatctgg ttccagaatc accgctacaa gacgaagcgg gcacagaacg
     2341 aaaagggata cgagcatccg gggctgctgc atggccacgc cacccacccg caccatccgt
     2401 cggccctgcc atcgccaagg cgcgtcgccg tgcccgtgct ggtgcgcaac ggcaagccgt
     2461 gcctcggcga cggctccaag ctggcgcccg actgtgtctc cgtgagctca gcgacggcca
     2521 cggccatgca gaatgcggcc gccgcccacc acctggtggc gctgaatggg gccgcctatc
     2581 agcatgcggc tgctgcggcc gccgctggac tccatgcaca tgcccatgcc catgcgcagg
     2641 cccatgccca cgttcatcca catgcgcatg cgcagcgtgc cgcctggtgg ccctaatact
     2701 gctagatacg gagaggctga gcgagagtca gtggcagtgg cagtggcaga gggtgtggta
     2761 tggaggtatg gaggacactc gaatagtcga cactggagct gggaattcga acaaaacttt
     2821 ggtgcaataa tggaacataa tggaaccttg tcacagccgg ctcgccaggc caacccgccc
     2881 caccccccag aaaaaagaga accgaatcga agagaagcga aggagaagca gccaaaaact
     2941 aaatatgtgg aaaaagaaga gcatagtcaa agtagaagcc tctgtcaatc ctgtacataa
     3001 gtcagacaaa ggta