PREDICTED: Drosophila obscura xenotropic and polytropic retrovirus


LOCUS       XM_041591989            2011 bp    mRNA    linear   INV 14-MAY-2021
            receptor 1 homolog (LOC111066266), mRNA.
ACCESSION   XM_041591989
VERSION     XM_041591989.1
DBLINK      BioProject: PRJNA728747
KEYWORDS    RefSeq; corrected model; includes ab initio.
SOURCE      Drosophila obscura
  ORGANISM  Drosophila obscura
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NW_024542752.1) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI
            Annotation Status           :: Full annotation
            Annotation Name             :: Drosophila obscura Annotation
                                           Release 101
            Annotation Version          :: 101
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 8.6
            Annotation Method           :: Best-placed RefSeq; Gnomon
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            ##Genome-Annotation-Data-END##
            
            ##RefSeq-Attributes-START##
            ab initio            :: 1% of CDS bases
            frameshifts          :: corrected 9 indels
            internal stop codons :: corrected 1 genomic stop codons
            ##RefSeq-Attributes-END##
PRIMARY     REFSEQ_SPAN         PRIMARY_IDENTIFIER PRIMARY_SPAN        COMP
            1-7                 JAECWW010000165.1  2739945-2739951
            8-105               JAECWW010000165.1  2740134-2740231
            106-141             JAECWW010000165.1  2740321-2740356
            142-142             "N"                1-1
            143-282             JAECWW010000165.1  2740357-2740496
            283-284             "NN"               1-2
            285-383             JAECWW010000165.1  2740497-2740595
            384-483             JAECWW010000165.1  2740635-2740734
            484-509             JAECWW010000165.1  2740736-2740761
            510-855             JAECWW010000165.1  2740764-2741109
            856-885             JAECWW010000165.1  2741111-2741140
            886-1101            JAECWW010000165.1  2741142-2741357
            1102-1102           "N"                1-1
            1103-1255           JAECWW010000165.1  2741358-2741510
            1256-1478           JAECWW010000165.1  2741561-2741783
            1479-1512           JAECWW010000165.1  2741857-2741890
            1513-1551           JAECWW010000165.1  2741893-2741931
            1552-1552           "N"                1-1
            1553-1633           JAECWW010000165.1  2741932-2742012
            1634-2011           JAECWW010000165.1  2744065-2744442
FEATURES             Location/Qualifiers
     source          1..2011
                     /organism="Drosophila obscura"
                     /mol_type="mRNA"
                     /isolate="BZ-5 IFL"
                     /db_xref="taxon:7282"
                     /chromosome="Unknown"
                     /sex="male"
                     /tissue_type="whole fly"
                     /dev_stage="Adult fly"
                     /geo_loc_name="Serbia: Babin Zub"
                     /collection_date="2017"
     gene            1..2011
                     /gene="LOC111066266"
                     /note="The sequence of the model RefSeq transcript was
                     modified relative to its source genomic sequence to
                     represent the inferred CDS: inserted 5 bases in 4 codons;
                     deleted 7 bases in 5 codons; Derived by automated
                     computational analysis using gene prediction method:
                     Gnomon. Supporting evidence includes similarity to: 2
                     Proteins, and 62% coverage of the annotated genomic
                     feature by RNAseq alignments"
                     /db_xref="GeneID:111066266"
     CDS             1..1686
                     /gene="LOC111066266"
                     /note="The sequence of the model RefSeq protein was
                     modified relative to its source genomic sequence to
                     represent the inferred CDS: inserted 5 bases in 4 codons;
                     deleted 7 bases in 5 codons; substituted 1 base at 1
                     genomic stop codon"
                     /codon_start=1
                     /transl_except=(pos:1039..1041,aa:OTHER)
                     /product="LOW QUALITY PROTEIN: xenotropic and polytropic
                     retrovirus receptor 1 homolog"
                     /protein_id="XP_041447923.1"
                     /db_xref="GeneID:111066266"
                     /translation="METGTASCAACGAKAPQTFETHLTIEWRQQYLRYTALKAMIRQG
                     VDGXPHLGTASHKYGVESYYKAFEEAFCTECHNELDRVNNFFMEKLAEARXHATLKLQ
                     LLASARVPGHTSSAIALNSQRTAAADRKLMTQRQLRTVYSEFYLSLVLLQNFQSLNET
                     GSFRKICKKYQVSGVQLRRGLVRAAHSAGKPFGHYEPVPGGPFTWVIFNFFMAANVTG
                     WQRSGVNHVLIFDMDPRSHLQPATFLEIACTLGILWTLSMLGYLCHVPLHPLALILIM
                     LLLLLLVIPLPIMNWPARWTLARWTMRLMTAPLHYVGFADFWMGDQLNSLLTCLVDHY
                     YIVRFYTTCWLRXGAVPPYLTTDLMVPFMRCLPXLRRFRDSGSKSVTYLLNAGKYSTT
                     FCVVLFSTLRNRTDGTSLVPHRFPLTYGSMAASIVSTVYCYLWDVIKDFGLFRIRKGE
                     SAVLLLLNLLLRCFWVIEFTFYCHNLMTPHKARALASLLEITRRFIWNYVRLENGEYL
                     YNCGKFRATXDLAALKPRQERRLEDMMDESDRVTNRKRGSERERLGQQEKGRE"
     misc_feature    40..510
                     /gene="LOC111066266"
                     /note="SPX domain of the xenotropic and polytropic
                     retrovirus receptor 1 (XPR1) and related proteins; Region:
                     SPX_XPR1_like; cd14477"
                     /db_xref="CDD:269898"
     misc_feature    598..1524
                     /gene="LOC111066266"
                     /note="EXS family; Region: EXS; pfam03124"
                     /db_xref="CDD:460816"
ORIGIN      
        1 atggaaactg ggacggcttc ctgcgccgct tgtggggcaa aagcccccca aacctttgag
       61 acgcatctga ccatcgaatg gcgacagcag tacctgcgat atacggctct gaaggcaatg
      121 atcaggcagg gtgtggacgg tnggccgcat ctcggaaccg catcgcacaa atacggcgtc
      181 gagagctact acaaggcctt cgaggaggcc ttctgcaccg agtgccacaa cgagctggat
      241 cgcgtcaaca acttcttcat ggagaagctg gcggaggcgc gtnngcatgc caccctcaag
      301 ctgcagctgc tggcatccgc ccgggtgccc gggcatacgt ccagtgccat agcgctgaac
      361 tcacagcgaa cagcggcggc ggaccgtaag ttgatgaccc agcggcagct gcgcaccgtc
      421 tacagcgagt tctacctcag cctggtgctg ctccagaatt ttcagtcgct caacgagacg
      481 ggcagcttcc gcaagatctg taagaagtac caagtatctg gagtccaact ccggcgcgga
      541 ctggttcgag cggcacatag cgcaggcaaa ccttttggcc attatgagcc tgtaccgggg
      601 ggacccttca cctgggtcat cttcaacttc tttatggccg ccaatgtgac ggggtggcag
      661 cggtcgggcg tcaaccatgt gctgatattc gacatggatc cgcgcagcca cctgcagccg
      721 gccaccttcc tggagatcgc ctgcaccctc ggcatactgt ggacgctctc gatgctgggc
      781 tacctctgcc atgtaccgct gcatccgctg gccctgatcc tcatcatgct gctgctgctg
      841 ctgctggtga taccgctgcc gatcatgaac tggccggcac gctggacgct ggcacgctgg
      901 acgatgcgac tgatgactgc gccgctgcac tacgtgggct tcgccgactt ctggatgggc
      961 gatcagctga actcgctgct cacctgcctc gtcgatcact actacattgt gcgcttctac
     1021 accacctgct ggctgcggta gggggcggtg ccgccgtacc tcaccaccga tctgatggtg
     1081 ccgttcatgc gctgcctgcc cngcctgcgc cgattccggg acagcggctc caagtccgtc
     1141 acctatctgc tcaatgccgg gaagtactcg acgacattct gcgtggtgct cttctccacg
     1201 ctgcgcaatc gaacggatgg tacgagcctc gtcccccacc ggttcccact cacatacgga
     1261 tctatggccg cctccatagt gtccaccgtg tactgctatt tgtgggacgt gatcaaggac
     1321 tttggcctgt tccgcatccg caagggggag tccgcagtcc ttctactgct gaatctgctg
     1381 ctgcgctgct tctgggtgat cgagttcacg ttctactgcc acaacctgat gacgccccac
     1441 aaggccagag ctctggccag tctcctggag atcacgcggc gcttcatctg gaactacgtg
     1501 cgattggaga atggagagta tctgtacaac tgcggcaagt ttcgtgccac antcgatctg
     1561 gcggcgctca agccgcggca ggagcgcagg ctcgaggaca tgatggacga gtcggacagg
     1621 gtgaccaatc gcaagagggg cagcgaaaga gagaggctag gacagcagga gaaaggcaga
     1681 gaatgagcct gttgctatta ttaattgccg ctgccatcga tgctgctgct gctgctgctg
     1741 ctgctgctgt gtcaattaag ctgcaacatg agtcgagtgc agtgcaatat gcggcggctc
     1801 catgtcctct gtccgcagat tgtggccgat gtggccgatc ttggtacagt tgcacacgcg
     1861 ccaaaaccag accaaataga caaaaacaag caaacaacaa aaaggcgaag cgaaaaagca
     1921 aacaagcaaa gcgaagaaca gcccagtgga gggagcccaa cccaagccaa gtcgaatgaa
     1981 caaacaaaca aacaaatccc aatacgatac c