ID HQ158011; SV 1; circular; genomic DNA; STD; VRL; 2753 BP. XX AC HQ158011; XX DT 27-APR-2012 (Rel. 112, Created) DT 27-APR-2012 (Rel. 112, Last updated, Version 1) XX DE Cotton leaf curl virus isolate Sirsa-Haryana segment DNA-A, complete DE sequence. XX KW . XX OS Cotton leaf curl virus OC Viruses; Geminiviridae; Begomovirus; unclassified Begomovirus. XX RN [1] RP 1-2753 RA Chakrabarty P.K., Sable S.V., Kalbande B.B., Chavhan R.L., Monga D., RA Koundal V., Kumar D., Pappu H.R.; RT ; RL Submitted (18-AUG-2010) to the INSDC. RL Division of Crop Improvement, Central Institute for Cotton Research, Post RL Bag No. 2, Shankar Nagar, P.O., Nagpur, Maharashtra 440010, India XX DR MD5; 0b335b8e1812dc9d67de46ba8b37a09b. XX FH Key Location/Qualifiers FH FT source 1..2753 FT /organism="Cotton leaf curl virus" FT /segment="DNA-A" FT /host="Gossypium hirsutum" FT /isolate="Sirsa-Haryana" FT /serotype="UC" FT /mol_type="genomic DNA" FT /country="India" FT /collected_by="P.K. Chakrabarty, Suchitra Sable and Dilip FT Monga" FT /collection_date="Aug-2006" FT /db_xref="taxon:53010" FT gene complement(75..806) FT /gene="AC5" FT CDS complement(75..806) FT /codon_start=1 FT /gene="AC5" FT /product="ac5 protein" FT /db_xref="InterPro:IPR006892" FT /db_xref="InterPro:IPR013671" FT /db_xref="UniProtKB/TrEMBL:I1SZG6" FT /protein_id="AEI52884.1" FT /translation="MNILHSRRTGLIIKHIKYLSKILRFINRSTISNQEKHHTIRVILR FT LNVLIHPYLTQHINRLDTKSLTNSMGQPSTTSNITNTHYFTYMLNIMSGLKRLNLTWTF FT TSSRNIWTSVHPVHPGLPVQRPVCPCLLFCDADNGGSSTAGVWAAEVQTPAYFRRGRRN FT DDIGSSLRHNYGSVKYKLNPVLTRTQAYPVNNPATKVANISQKAYTETREPYQGIRLIV FT DPTCLNLKLSAQVLIVCGSVI" FT gene 131..487 FT /gene="AV2" FT CDS 131..487 FT /codon_start=1 FT /gene="AV2" FT /product="precoat/movement protein" FT /db_xref="GOA:I1SZG0" FT /db_xref="InterPro:IPR002511" FT /db_xref="InterPro:IPR005159" FT /db_xref="UniProtKB/TrEMBL:I1SZG0" FT /protein_id="AEI52878.1" FT /translation="MWDPLLNEFPDTVHGFRCMLSVKYLQLLSQDYSPDTLGYELIRDL FT ICILRSRNYVEASCRYRHFYARVESTPASELRQPIHQPCCCPHCPRHKTTGMDKQAFEQ FT EAQDVQDVQKSRCS" FT gene 291..1061 FT /gene="AV1" FT CDS 291..1061 FT /codon_start=1 FT /gene="AV1" FT /product="coat protein" FT /db_xref="GOA:I1SZG1" FT /db_xref="InterPro:IPR000263" FT /db_xref="InterPro:IPR000650" FT /db_xref="UniProtKB/TrEMBL:I1SZG1" FT /protein_id="AEI52879.1" FT /translation="MSKRAADIVISTPASKVRRRLNFGSPYTSRAAAPIVRVTKQQAWT FT NRPLNRKPRMYRMYRSPDVPRGCEGPCKVQSFESRHDIQHIGKVMCISDVTRGTGLTHR FT VGKRFCVKSVYVLGKIWMDENIKTKNHTNSVMFFLVRDRRPVDKPQDFGEVFNMFDNEP FT STATVKNVHRDRYQVLRKWYATVTGGQYASKEQALVKKFVRVNNYVVYNQQEAGKYENH FT TENALMLYMACTHASNPVYATLKIRIYFYDSVTN" FT gene complement(1064..1468) FT /gene="AC3" FT CDS complement(1064..1468) FT /codon_start=1 FT /gene="AC3" FT /product="replication enhancer protein" FT /note="ren" FT /db_xref="GOA:I1SZG2" FT /db_xref="InterPro:IPR000657" FT /db_xref="UniProtKB/TrEMBL:I1SZG2" FT /protein_id="AEI52880.1" FT /translation="MDSRTGEPITAAQAGNGAYIWEVPNPLYFKIISHVNRPFTTNMDI FT LTIRIQFNYNTRKALGLHKCFLTFRIWTTLQPQTGLFLRVFKTQVLKYLNNLGVISINL FT VIKAVEHVLYNVIQQTMYVDQYSEIKFKLH" FT gene complement(1161..1613) FT /gene="AC2" FT CDS complement(1161..1613) FT /codon_start=1 FT /gene="AC2" FT /product="transcription activator protein" FT /db_xref="GOA:I1SZG3" FT /db_xref="InterPro:IPR000942" FT /db_xref="UniProtKB/TrEMBL:I1SZG3" FT /protein_id="AEI52881.1" FT /translation="MRPSSHRIGPCTQVPIKVQHREAKRRNRRRRVDLECGCSYYLSIN FT CHNHGFTHRGTHHCSSSREWRIYLGGSKSPLFQDHQPRQPSIHDEYGHTHDQDPVQLQH FT SESSGTAQVFSNIPNLDDLTASDWSFLKGIQNPSPQISEQSRCNFN" FT gene complement(1510..2598) FT /gene="AC1" FT CDS complement(1510..2598) FT /codon_start=1 FT /gene="AC1" FT /product="replication initiator protein" FT /db_xref="GOA:I1SZG4" FT /db_xref="InterPro:IPR001191" FT /db_xref="InterPro:IPR001301" FT /db_xref="InterPro:IPR022690" FT /db_xref="UniProtKB/TrEMBL:I1SZG4" FT /protein_id="AEI52882.1" FT /translation="MPPKRNGFYSKNYFITYPKCSLTKEEALSQLLNIQTPTSKKYIRI FT CRELHEDGTPHLHVLIQFEGKFKCQNMRFFDLVSPSRSAHFHPNIQGAKSSSDVKSYIE FT KDGDILDWGQFQIDGRSARGGHQACNGSALQRKKVGSKSEILRVIKELALEDHVLRFHN FT LNAKLDRKFQETPSTYITQASFLYFNQVTEERALQIIESLINVAPLVNSVIMLAYDGTS FT RGGKARAATSLGPYNSPCGHLVWNPRVEEDEKENIRTRVAPTQILKHFKEFMGAHKARP FT SGAKSGKPVRAKGGIPAIILGNPGPNSSYKEFLDEEKNSALKNWALKNATFITQDRPMY FT SGTNQSTAQGSEEAQQEEESRS" FT gene complement(2142..2444) FT /gene="AC4" FT CDS complement(2142..2444) FT /codon_start=1 FT /gene="AC4" FT /product="ac4 protein" FT /db_xref="InterPro:IPR002488" FT /db_xref="UniProtKB/TrEMBL:I1SZG5" FT /protein_id="AEI52883.1" FT /translation="MGLLTCMFSSSSKGNSSARICDSSTWSPQAGQHISIRTYRELNPA FT PTSNPTSRRTGTFSTGGNFRSTEGQQEEGIKHAMALHCSGRKWEVSRKFLESLRN" XX SQ Sequence 2753 BP; 717 A; 571 C; 618 G; 847 T; 0 other; accggatggc cgcgcgattt ttttgtgggc cttaccatta acacttgtcg gccaatcata 60 tgactccctc aaagctaaat aacgctcccg cacactataa gtacttgcgc actaagtttc 120 aaattcaaac atgtgggatc cactattaaa cgaattccct gatacggttc acgggtttcg 180 gtgtatgctt tctgtgaaat atttgcaact tttgtcgcag gattattcac cggatacgct 240 tgggtacgag ttaatacggg atttaatttg tattttacgc tcccgtaatt atgtcgaagc 300 gagctgccga tatcgtcatt tctacgcccg cgtcgaaagt acgccggcgt ctgaacttcg 360 gcagcccata caccagccgt gctgctgccc ccattgtccg cgtcacaaaa caacaggcat 420 ggacaaacag gcctttgaac aggaagccca ggatgtacag gatgtacaga agtccagatg 480 ttcctagagg atgtgaaggt ccatgtaagg ttcagtcgtt tgagtccaga catgatattc 540 agcatatagg taaagtaatg tgtattagtg atgttactcg tggtactggg ctgacccata 600 gagttggtaa gagattttgt gtcaagtctg tttatgtgtt gggtaagata tggatggatg 660 agaacattaa gacgaagaat cacacgaata gtgtgatgtt tttcttggtt agagatcgta 720 gacctgttga taaacctcaa gattttggag aggtatttaa tatgtttgat aatgagccca 780 gtacggcgac tgtgaagaat gttcatcgtg ataggtatca agttctgcgc aaatggtatg 840 caactgtcac cggtggacaa tacgcttcaa aggaacaggc tttggtcaag aagtttgtca 900 gagttaacaa ttatgttgtt tacaatcaac aggaagcagg aaaatacgag aatcatacgg 960 aaaatgcgtt aatgctttat atggcttgta ctcacgctag caaccctgtt tatgctacgt 1020 tgaagattag gatatatttt tatgactctg taacgaattg atattaatga agtttgaatt 1080 ttatttctga atattgatct acatacatag tttgttggat tacattgtac aatacatgtt 1140 ctacagcttt aataactaaa ttaattgaaa ttacaccgag attgttcaga tatttgagga 1200 cttgggtttt gaataccctt aagaaaagac cagtctgagg ctgtaaggtc gtccagattc 1260 ggaatgttag aaaacacttg tgcagtccca gagctttccg agtgttgtag ttgaactgga 1320 tcctgatcgt gagtatgtcc atattcgtcg tgaatggacg gttgacgtgg ctgatgatct 1380 tgaaataaag gggatttgga acctcccaga tatatgcgcc attccctgct tgagctgcag 1440 tgatgggttc ccctgtgcgt gaatccatgg ttgtggcagt tgattgacag ataataagaa 1500 cacccgcatt caagatctac tctcctcctc ctgttgcgcc tcttcgcttc cctgtgctgt 1560 actttgattg gtacctgagt acatgggcct atcctgtgtg atgaaggtcg cattctttaa 1620 cgcccaattt tttagtgcag aattcttctc ttcatccaaa aactctttat agcttgaatt 1680 gggtcctgga ttgccaagga ttatagcggg aattccgcct ttagctcgaa ctggcttccc 1740 ggattttgca cctgatggcc ttgccttgtg ggcccccatg aactccttaa agtgctttag 1800 aatctgcgtt ggagccaccc gcgtccttat attctccttt tcatcttctt ctacccttgg 1860 gttccaaact agatgtccac atgggctgtt atatggacct aatgatgtgg ctgccctcgc 1920 cttccccccc ctactggtac cgtcatacgc taacattatg acgctattga ccaggggagc 1980 gacattgata aggctctcaa ttatctgcag tgcacgttct tctgtgacct gattgaaata 2040 aagaaaggac gcctgagtaa tatacgtaga tggcgtctcc tgaaattttc tgtctagctt 2100 tgcatttaaa ttgtgaaatc gcaatacgtg atcctcaaga gctagttcct taatgactct 2160 aagaatttcc gacttacttc ccactttctt ccgctgcaat gcagagccat tgcatgcttg 2220 atgccctcct cttgctgacc ttccgtcgat ctgaaattgc ccccagtcga gaatgtcccc 2280 gtccttctcg atgtaggatt tgacgtcgga gctggattta gctccctgta tgttcggatg 2340 gaaatgtgct gacctgcttg gggagaccaa gtcgaagaat cgcatattct ggcacttgaa 2400 tttcccttcg aactggatga gaacatgcaa gtgaggagtc ccatcttcgt gaagctctct 2460 gcagattcta atatattttt ttgaagttgg ggtttgtata tttaataatt gggaaagtgc 2520 ttcctctttg gtgagagaac atttgggata agtgatgaaa tagtttttgg aataaaaacc 2580 gttccgcttt ggaggcatgt tgactaaaat tgatcaccga ttgaccgctc ttgcaactct 2640 ccctggtata tcggtgatca atatatagtg atcaccaaat ggcataatgg taataaaaaa 2700 actttaattt gaaattcaaa ccaaaaggct aaagcggcca tccgtttaat att 2753 //