ID   JX898689; SV 1; circular; genomic DNA; STD; VRL; 3182 BP.
XX
AC   JX898689;
XX
DT   19-DEC-2012 (Rel. 115, Created)
DT   19-DEC-2012 (Rel. 115, Last updated, Version 1)
XX
DE   Hepatitis B virus isolate P29, complete genome.
XX
KW   .
XX
OS   Hepatitis B virus
OC   Viruses; Hepadnaviridae; Orthohepadnavirus.
XX
RN   [1]
RP   1-3182
RA   Alestig E.;
RT   "Genetic diversity of genotype D3 in acute hepatitis B";
RL   Unpublished.
XX
RN   [2]
RP   1-3182
RA   Alestig E.;
RT   ;
RL   Submitted (01-OCT-2012) to the INSDC.
RL   Infectious Diseases, University of Gothenburg, Guldhedsgatan 10B,
RL   Gothenburg 41346, Sweden
XX
DR   MD5; e9017ddcaffd29e3b2e26d016a7ea6a5.
XX
CC   ##Assembly-Data-START##
CC   Assembly Method       :: Lasergene v. 8
CC   Sequencing Technology :: Sanger dideoxy sequencing
CC   ##Assembly-Data-END##
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..3182
FT                   /organism="Hepatitis B virus"
FT                   /host="Homo sapiens"
FT                   /isolate="P29"
FT                   /mol_type="genomic DNA"
FT                   /country="Sweden"
FT                   /collection_date="1986"
FT                   /note="genotype: D3"
FT                   /db_xref="taxon:10407"
FT   gene            join(2307..3182,1..1623)
FT                   /gene="P"
FT   CDS             join(2307..3182,1..1623)
FT                   /codon_start=1
FT                   /gene="P"
FT                   /product="polymerase"
FT                   /db_xref="GOA:L0CN97"
FT                   /db_xref="InterPro:IPR000201"
FT                   /db_xref="InterPro:IPR000477"
FT                   /db_xref="InterPro:IPR001462"
FT                   /db_xref="InterPro:IPR037531"
FT                   /db_xref="UniProtKB/TrEMBL:L0CN97"
FT                   /protein_id="AGA16760.1"
FT                   /translation="MPLSYQHFRKLLLLDDEAGPLEEELPRLADEGLNRRVAEDLNLGN
FT                   LNVSIPWTHKVGNFTGLYSSTVPVFNPHWKTPSFPNIHLHQDIIKKCEQFVGPLTINEK
FT                   RRLQLIMPARFYPKVTKYLPLDKGIKPYYPEHLVNHYFQTRHYLHTLWKAGILYKRETT
FT                   HSASFCGSPYSWEQDLQHGAESFHQQSSGILSRPPVGSSLQSKHRKSRLGLQSQQGHLA
FT                   RRQQGRSWSIRAGFHPTARRPFGVEPSGSGHTTNFASKSASCLHQSPDRKAAYPAVSTF
FT                   EKHSSSGHAVEFHNLSPNSARSQSERPVFPCWWLQFRSSKPCSDYCLSLIVNLLEDWGP
FT                   CAEHGEHHIRIPRTPSRVTGGVFLVDKNPHNTAESRLVVDFSQFSRGNYRVSWPKFAVP
FT                   NLQSLTNLLSSNLSWLSLDVSAAFYHLPLHPAAMPHLLVGSSGLSRYVARLSSNSRILN
FT                   HQHGTMPNLHDYCSRNLYVSLLLLYQTFGRKLHLYSHPIILGFRKIPMGVGLSPFLLAQ
FT                   FTSAICSVVRRAFPHCLAFSYMDDVVLGAKSVQHLESLFTAVTNFLLSLGIHLNPNKTK
FT                   RWGYSLNFMGYVIGSYGSLPQEHIIQKIKECFRKLPINRPIDWKVCQRIVGLLGFAAPF
FT                   TQCGYPALMPLYACIQSKQAFTFSPTYKAFLCKQYLNLYPVARQRPGLCQVFADATPTG
FT                   WGLVMGHQRMRGTFSAPLPIHTAELLAACFARSRSGANIIGTDNSVVLSRKYTSYPWLL
FT                   GCAANWILRGTSFVYVPSALNPADDPSRGRLGLSRPLLRLPFRPTTGRTSLYADSPSVP
FT                   SHLPDRVHFASPLHVAWRPP"
FT   gene            join(2848..3182,1..835)
FT                   /gene="S"
FT   CDS             join(2848..3182,1..835)
FT                   /codon_start=1
FT                   /gene="S"
FT                   /product="large S protein"
FT                   /note="pre-S1/pre-S2/S"
FT                   /db_xref="GOA:L0CLC1"
FT                   /db_xref="InterPro:IPR000349"
FT                   /db_xref="UniProtKB/TrEMBL:L0CLC1"
FT                   /protein_id="AGA16761.1"
FT                   /translation="MGQNLSTSNPLGFFPDHQLDPAFRANTANPDWDFNPNKDTWPDAS
FT                   KVGAGAFGLGFTPPHGGLLGWSPQAQGILQTLPANPPPASTNRQTGRQPTPLSPPLRNT
FT                   HPQAMQWNSTTFHQTLQDPRVRGLYFPAGGSSSGAVNPVPTTASPLSSIFSRIGDPALN
FT                   MESITSGFLGPLLVLQAGFFLLTRILTIPQSLDSWWTSLNFLGGTTVCLGQNSQSPTSN
FT                   HSPTSCPPTCPGYRWMCLRRFIIFLFILLLCLIFLLVLLDYQGMLPVCPLIPGSSTTST
FT                   GPCRTCMTTAQGTSMYPSCCCTKPSDGNCTCIPIPSSWAFGKFLWEWASARFSWLSLLV
FT                   PFVQWFVGLSPTVWLSVIWMMWYWGPSLYSILSPFLPLLPIFFCLWVYI"
FT   CDS             join(3172..3182,1..835)
FT                   /codon_start=1
FT                   /gene="S"
FT                   /product="middle S protein"
FT                   /note="pre-S2/S"
FT                   /db_xref="GOA:B5TF55"
FT                   /db_xref="InterPro:IPR000349"
FT                   /db_xref="UniProtKB/TrEMBL:B5TF55"
FT                   /protein_id="AGA16762.1"
FT                   /translation="MQWNSTTFHQTLQDPRVRGLYFPAGGSSSGAVNPVPTTASPLSSI
FT                   FSRIGDPALNMESITSGFLGPLLVLQAGFFLLTRILTIPQSLDSWWTSLNFLGGTTVCL
FT                   GQNSQSPTSNHSPTSCPPTCPGYRWMCLRRFIIFLFILLLCLIFLLVLLDYQGMLPVCP
FT                   LIPGSSTTSTGPCRTCMTTAQGTSMYPSCCCTKPSDGNCTCIPIPSSWAFGKFLWEWAS
FT                   ARFSWLSLLVPFVQWFVGLSPTVWLSVIWMMWYWGPSLYSILSPFLPLLPIFFCLWVYI
FT                   "
FT   CDS             155..835
FT                   /codon_start=1
FT                   /gene="S"
FT                   /product="S protein"
FT                   /note="HBsAg"
FT                   /db_xref="GOA:Q2PWG5"
FT                   /db_xref="InterPro:IPR000349"
FT                   /db_xref="UniProtKB/TrEMBL:Q2PWG5"
FT                   /protein_id="AGA16763.1"
FT                   /translation="MESITSGFLGPLLVLQAGFFLLTRILTIPQSLDSWWTSLNFLGGT
FT                   TVCLGQNSQSPTSNHSPTSCPPTCPGYRWMCLRRFIIFLFILLLCLIFLLVLLDYQGML
FT                   PVCPLIPGSSTTSTGPCRTCMTTAQGTSMYPSCCCTKPSDGNCTCIPIPSSWAFGKFLW
FT                   EWASARFSWLSLLVPFVQWFVGLSPTVWLSVIWMMWYWGPSLYSILSPFLPLLPIFFCL
FT                   WVYI"
FT   gene            1374..1838
FT                   /gene="X"
FT   CDS             1374..1838
FT                   /codon_start=1
FT                   /gene="X"
FT                   /product="X peptide"
FT                   /db_xref="GOA:O11883"
FT                   /db_xref="InterPro:IPR000236"
FT                   /db_xref="UniProtKB/TrEMBL:O11883"
FT                   /protein_id="AGA16764.1"
FT                   /translation="MAARLCCQLDPARDVLCLRPVGAESCGRPFSGSLGTLSSPSPSAV
FT                   PTDHGAHLSLRGLPVCAFSSAGPCALRFTSARRMETTVNAHRMLPKVLHKRTLGLSAMS
FT                   TTDLEAYFKDCLFKDWEELGEEIRLKVFVLGGCRHKLVCAPAPCNFFTSA"
FT   gene            1814..2452
FT                   /gene="C"
FT   CDS             1814..2452
FT                   /codon_start=1
FT                   /gene="C"
FT                   /product="precore/core protein"
FT                   /db_xref="GOA:Q89656"
FT                   /db_xref="InterPro:IPR002006"
FT                   /db_xref="InterPro:IPR013195"
FT                   /db_xref="InterPro:IPR036459"
FT                   /db_xref="UniProtKB/TrEMBL:Q89656"
FT                   /protein_id="AGA16765.1"
FT                   /translation="MQLFHLCLIISCSCPTVQASKLCLGWLWGMDIDPYKEFGATVELL
FT                   SFLPSDFFPSVRDLLDTASALYREALESPEHCSPHHTALRQAILCWGELMTLATWVGVN
FT                   LEDPASRDLVVSYVNTNMGLKFRQLLWFHISCLTFGRETVIEYLVSFGVWIRTPPAYRP
FT                   PNAPILSTLPETTVVRRRGRSPRRRTPSPRRRRSQSPRRRRSQSRESQC"
FT   CDS             1901..2452
FT                   /codon_start=1
FT                   /gene="C"
FT                   /product="core protein"
FT                   /db_xref="GOA:Q778I9"
FT                   /db_xref="InterPro:IPR002006"
FT                   /db_xref="InterPro:IPR036459"
FT                   /db_xref="UniProtKB/TrEMBL:Q778I9"
FT                   /protein_id="AGA16766.1"
FT                   /translation="MDIDPYKEFGATVELLSFLPSDFFPSVRDLLDTASALYREALESP
FT                   EHCSPHHTALRQAILCWGELMTLATWVGVNLEDPASRDLVVSYVNTNMGLKFRQLLWFH
FT                   ISCLTFGRETVIEYLVSFGVWIRTPPAYRPPNAPILSTLPETTVVRRRGRSPRRRTPSP
FT                   RRRRSQSPRRRRSQSRESQC"
XX
SQ   Sequence 3182 BP; 729 A; 855 C; 692 G; 906 T; 0 other;
     ttccacaacc tttcaccaaa ctctgcaaga tcccagagtg agaggcctgt atttccctgc        60
     tggtggctcc agttcaggag cagtaaaccc tgttccgact actgcctctc ccttatcgtc       120
     aatcttctcg aggattgggg accctgcgct gaacatggag agcatcacat caggattcct       180
     aggacccctt ctcgtgttac aggcggggtt tttcttgttg acaagaatcc tcacaatacc       240
     gcagagtcta gactcgtggt ggacttctct caattttcta gggggaacta ccgtgtgtct       300
     tggccaaaat tcgcagtccc caacctccaa tcactcacca acctcctgtc ctccaacttg       360
     tcctggttat cgctggatgt gtctgcggcg ttttatcatc ttcctcttca tcctgctgct       420
     atgcctcatc ttcttgttgg ttcttctgga ctatcaaggt atgttgcccg tttgtcctct       480
     aattccagga tcctcaacca ccagcacggg accatgccga acctgcatga ctactgctca       540
     aggaacctct atgtatccct cctgttgctg taccaaacct tcggacggaa attgcacctg       600
     tattcccatc ccatcatcct gggctttcgg aaaattccta tgggagtggg cctcagcccg       660
     tttctcctgg ctcagtttac tagtgccatt tgttcagtgg ttcgtagggc tttcccccac       720
     tgtttggctt tcagttatat ggatgatgtg gtattggggg ccaagtctgt acagcatctt       780
     gagtcccttt ttaccgctgt taccaatttt cttttgtctt tgggtataca tttaaaccct       840
     aacaaaacaa agagatgggg ttactctctg aattttatgg gttatgtcat tggaagttat       900
     gggtccttgc cacaagaaca catcatacaa aaaatcaaag aatgttttag aaaacttcct       960
     attaacaggc ctattgattg gaaagtatgt caacgaattg tgggtctttt gggctttgct      1020
     gcccctttta cacaatgtgg ttatcctgcg ttaatgccct tgtatgcatg tattcaatct      1080
     aagcaggctt tcactttctc gccaacttac aaggcctttc tgtgtaaaca atacctgaac      1140
     ctttaccccg ttgcccggca acggccaggt ctgtgccaag tgtttgctga cgcaaccccc      1200
     actggctggg gcttggtcat gggccatcag cgcatgcgtg gaaccttttc ggctcctctg      1260
     ccgatccata ctgcggaact cctagccgct tgttttgctc gcagcaggtc tggagcaaac      1320
     attatcggga ctgataactc tgttgtcctc tcccgcaaat atacatcgta tccatggctg      1380
     ctaggctgtg ctgccaactg gatcctgcgc gggacgtcct ttgtttacgt cccgtcggcg      1440
     ctgaatcctg cggacgaccc ttctcggggt cgcttgggac tctctcgtcc ccttctccgt      1500
     ctgccgttcc gaccgaccac ggggcgcacc tctctttacg cggactcccc gtctgtgcct      1560
     tctcatctgc cggaccgtgt gcacttcgct tcacctctgc acgtcgcatg gagaccaccg      1620
     tgaacgccca ccgaatgttg cccaaggtct tacataagag gactcttgga ctctctgcaa      1680
     tgtcaacgac cgaccttgag gcatacttca aagactgttt gtttaaagac tgggaggagt      1740
     tgggggagga gattaggtta aaggtctttg tactaggagg ctgtaggcat aaattggtct      1800
     gcgcaccagc accatgcaac tttttcacct ctgcctaatc atctcttgtt catgtcctac      1860
     tgttcaagcc tccaagctgt gccttgggtg gctttggggc atggacatcg acccttataa      1920
     agaatttgga gctactgtgg agttactctc gtttttgcct tctgacttct ttccttcagt      1980
     acgagatctt ctagataccg cctcagctct gtatcgggaa gccttagagt ctcctgagca      2040
     ttgttcacct caccatactg cactcaggca agcaattctt tgctgggggg aactaatgac      2100
     tctagctacc tgggtgggtg ttaatttgga agatccagca tctagagacc tagtagtcag      2160
     ttatgtcaac actaatatgg gcctaaagtt caggcaactc ttgtggtttc acatttcttg      2220
     tctcactttt ggaagagaaa ccgttataga gtatttggtg tctttcggag tgtggattcg      2280
     cactcctcca gcttatagac caccaaatgc ccctatccta tcaacacttc cggaaactac      2340
     tgttgttaga cgacgaggca ggtcccctag aagaagaact ccctcgcctc gcagacgaag      2400
     gtctcaatcg ccgcgtcgca gaagatctca atctcgggaa tctcaatgtt agtattcctt      2460
     ggactcataa ggtggggaac tttactggtc tttattcttc tactgtacct gtctttaatc      2520
     ctcattggaa aacaccatct tttcctaata tacatttaca ccaagacatt atcaaaaaat      2580
     gtgaacagtt tgtaggccca cttacaatta atgagaaaag aagattgcaa ttgattatgc      2640
     ctgctaggtt ttatccaaag gttaccaaat atttaccatt ggataagggt attaaacctt      2700
     attatccaga acatctagtt aatcattact tccaaactag acactattta cacactctat      2760
     ggaaggcggg tatattatat aagagagaaa caacacatag cgcctcattt tgtgggtcac      2820
     catattcttg ggaacaagat ctacagcatg gggcagaatc tttccaccag caatcctctg      2880
     ggattctttc ccgaccacca gttggatcca gccttcagag caaacaccgc aaatccagat      2940
     tgggacttca atcccaacaa ggacacctgg ccagacgcca gcaaggtagg agctggagca      3000
     ttcgggctgg gtttcacccc accgcacgga ggccttttgg ggtggagccc tcaggctcag      3060
     ggcatactac aaactttgcc agcaaatccg cctcctgcct ccaccaatcg ccagacagga      3120
     aggcagccta ccccgctgtc tccacctttg agaaacactc atcctcaggc catgcagtgg      3180
     aa                                                                     3182
//