From d3678f7a09414dd7ef7818406051883e1f07b6b2 Mon Sep 17 00:00:00 2001 From: Vitaliy Mysak Date: Mon, 18 Sep 2023 12:15:29 -0700 Subject: [PATCH] include subtype positions to orfs.csv --- intact/intact.py | 16 +- tests/expected-results-large-csv/orfs.csv | 904 +++++----- tests/expected-results-large/orfs.json | 1804 +++++++++++++++----- tests/expected-results-single-csv/orfs.csv | 24 +- tests/expected-results-single/orfs.json | 44 +- tests/expected-results-small-csv/orfs.csv | 112 +- tests/expected-results-small/orfs.json | 220 ++- 7 files changed, 2082 insertions(+), 1042 deletions(-) diff --git a/intact/intact.py b/intact/intact.py index 044ad11..d95268a 100644 --- a/intact/intact.py +++ b/intact/intact.py @@ -82,6 +82,8 @@ class CandidateORF: name: str start: int end: int + subtype_start: int + subtype_end: int orientation: str distance: float protein: str @@ -90,9 +92,11 @@ class CandidateORF: @dataclass class FoundORF: name: str - orientation: str start: int end: int + subtype_start: int + subtype_end: int + orientation: str distance: str protein: str aminoacids: str @@ -568,8 +572,8 @@ def find_candidate_positions(e, q_start, q_end): closest_start = min(n, (closest_start_a * 3) + frame) closest_end = min(n + 1, (closest_end_a * 3) + 3 + frame) got_protein = get_biggest_protein(has_start_codon(e), got_aminoacids) - yield CandidateORF(e.name, closest_start, closest_end, "forward", - dist, got_protein, got_aminoacids) + yield CandidateORF(e.name, closest_start, closest_end, e.start, e.end, + "forward", dist, got_protein, got_aminoacids) def find_real_correspondence(e): q_start = coordinates_mapping[e.start] @@ -730,7 +734,7 @@ def __enter__(self, *args): self.errors = {} elif self.fmt == "csv": self.orfs_writer = csv.writer(self.orfs_file) - self.orfs_header = ['seqid'] + [field.name for field in dataclasses.fields(CandidateORF)] + self.orfs_header = ['seqid'] + [field.name for field in dataclasses.fields(FoundORF)] self.orfs_writer.writerow(self.orfs_header) self.holistic_writer = csv.writer(self.holistic_file) self.holistic_header = ['seqid'] + [field.name for field in dataclasses.fields(HolisticInfo)] @@ -900,9 +904,11 @@ def intact( working_dir, hxb2_found_orfs = [FoundORF( o.name, - o.orientation, o.start, o.end, + o.subtype_start, + o.subtype_end, + o.orientation, o.distance, str(o.protein), str(o.aminoacids), diff --git a/tests/expected-results-large-csv/orfs.csv b/tests/expected-results-large-csv/orfs.csv index 9bf4483..c309c8f 100644 --- a/tests/expected-results-large-csv/orfs.csv +++ b/tests/expected-results-large-csv/orfs.csv @@ -1,452 +1,452 @@ -seqid,name,start,end,orientation,distance,protein,aminoacids -KX505501.1,env,0,1824,forward,1.9898364485981306,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ* -KX505501.1,gag,336,1824,forward,0.3622000000000025,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ* -KX505501.1,vif,1306,1927,forward,2.1463541666666663,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI* -KX505501.1,nef,1306,1927,forward,2.1430894308943085,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI* -KX505501.1,pol,1628,1748,forward,2.1349950149551358,FCRENLAFPQGKAGEFPSEQTRANSPTSRELQVWGRDTN,FCRENLAFPQGKAGEFPSEQTRANSPTSRELQVWGRDTN* -KX505501.1,tat_exon2,1746,1824,forward,2.12,RCIRSTTRTADTELFTRDFPLGTFQ,RCIRSTTRTADTELFTRDFPLGTFQ* -KX505501.1,vpu,1747,1927,forward,2.098780487804878,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI* -KX505501.1,rev_exon2,1747,1927,forward,1.9802197802197803,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI* -KX505501.1,vpr,1748,1751,forward,2.1884615384615382,M,M -KX505501.1,tat_exon1,1748,1751,forward,2.1875,M,M -KX505501.1,rev_exon1,1748,1751,forward,2.1653846153846152,M,M -MN691959,gag,639,2142,forward,0.05400000000000005,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ* -MN691959,pol,1934,4946,forward,0.03589232303090717,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MN691959,vif,4890,5469,forward,0.0625,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH* -MN691959,vpr,5408,5702,forward,0.21153846153845945,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*T -MN691959,tat_exon1,5679,5895,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ -MN691959,rev_exon1,5818,5896,forward,0.5769230769230769,MAGRSGDSDEDLLKTVRLIKFLYQSS,MAGRSGDSDEDLLKTVRLIKFLYQSS -MN691959,vpu,5910,6156,forward,0.7060975609756097,SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL,MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL* -MN691959,env,6070,8683,forward,0.0867990654205606,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*DGWQVVKK* -MN691959,tat_exon2,8237,8333,forward,0.19999999999999996,RPTSQTRGDPTGPKE,RPTSQTRGDPTGPKE*KKKVERETETDPFD** -MN691959,rev_exon2,8238,8514,forward,0.16483516483516492,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE* -MN691959,nef,8657,9278,forward,0.16991869918698432,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC* -MN692074,env,2,4115,forward,1.9582943925233647,MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI* -MN692074,gag,789,2292,forward,0.13880000000000003,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ* -MN692074,pol,2084,4115,forward,0.7912263210369039,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI* -MN692074,vif,3617,4115,forward,1.9968750000000002,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI* -MN692074,vpr,3617,4085,forward,1.9602564102564104,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDT,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDT -MN692074,nef,3617,4115,forward,1.965040650406504,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI* -MN692074,tat_exon1,3823,4084,forward,2.0305555555555554,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY -MN692074,rev_exon1,3823,4084,forward,2.0153846153846153,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY -MN692074,vpu,4080,4164,forward,2.09390243902439,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI* -MN692074,tat_exon2,4080,4164,forward,2.1133333333333333,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI* -MN692074,rev_exon2,4080,4164,forward,2.065934065934066,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI* -MN692145,gag,775,2287,forward,0.15900000000000003,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*R* -MN692145,pol,2070,5085,forward,0.10618145563310066,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED* -MN692145,vif,5029,5608,forward,0.21875,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH* -MN692145,vpr,5547,5841,forward,0.44358974358974423,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*T -MN692145,tat_exon1,5818,6037,forward,0.29166666666666674,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ* -MN692145,rev_exon1,5957,6038,forward,0.5192307692307692,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK -MN692145,vpu,6049,6298,forward,0.5804878048780489,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL* -MN692145,env,6212,8783,forward,0.4975467289719626,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL* -MN692145,tat_exon2,8364,8460,forward,0.4866666666666659,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH** -MN692145,rev_exon2,8365,8641,forward,0.2637362637362637,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE* -MN692145,nef,8784,9576,forward,0.3878048780487735,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*HRAFYKGLSAGDFPGEAWPGRGRGVASPQMLHISSCFCLYWVSLVRPDLSLGALWLTREPTA* -MN090335,gag,315,1665,forward,0.8911999999999998,MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ,MYTIEGGYCII**SKFF*SCLKGWL*LFQYLFTAS*CF*QARINCESF*FPACPYYMF*SIFFLSPWP*PNFLPSI*FSPAQY*RSRTHLSPSSLR*SKMAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ* -MN090335,pol,1427,4469,forward,0.2169491525423728,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MN090335,vif,4413,5001,forward,0.34375,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH*SF* -MN090335,vpr,4931,5225,forward,0.5192307692307698,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*T -MN090335,tat_exon1,5202,5418,forward,0.45833333333333326,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ -MN090335,rev_exon1,5341,5419,forward,0.6923076923076923,MAGRSGDRDEDLLKTVRLIKFLYQSS,MAGRSGDRDEDLLKTVRLIKFLYQSS -MN090335,vpu,5433,5682,forward,0.6560975609756099,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL* -MN090335,env,5596,8158,forward,0.6022196261682247,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ* -MN090335,tat_exon2,7739,7835,forward,0.3999999999999999,RPSSQPRGDQTGPKE,RPSSQPRGDQTGPKE*KKKVERETEADPED** -MN090335,rev_exon2,7740,8016,forward,0.46153846153846145,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE* -MN090335,nef,8159,8819,forward,0.5260162601625942,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*H* -MN090376,gag,376,1639,forward,2.1734000000000018,MQTQIVRPF,MFCTIG*FWLTWLLFPGSAAACCVFFLLLFCSSSILSKASLVSFISIL*CTQ*RTATVLNNDLSSSDPV*SAGCSCPSICLQPSDVSNRPGLTANRSSSLLAHTICFNLYLFFPPGLNRIFSHLSNSPPLNTDALAPISLLLASASQKGVLTVRRPSPLAVRASASRVR*FWD*IK**ECIVLPAFWT*DKDQRNPLETM*IGSIKL*EPSKLHRR*KIG*QKPCWSRMQTQIVRPF*KHWVQQLH*KK**QHAREWEDPAIRQEFWRKQ*AK*QTQLP**CRKAILGAKERWLSVSIVAKKGT*PEIAGPLGKGAVGNVERKDTK*KIVLRDRQIF*GKSGLPTRGGQGTFLKAEQNQQPHQRRASVLGRRQQLLLRSRSR*TRNYTLCLPSNHSLATTLSHSKDRGATKGSSIRYRSR* -MN090376,pol,1382,4394,forward,0.18823529411764706,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED* -MN090376,vif,4338,4929,forward,0.41770833333333335,MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH*NF* -MN090376,vpr,4859,5153,forward,0.44230769230769296,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*T -MN090376,tat_exon1,5130,5346,forward,0.5833333333333333,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ -MN090376,rev_exon1,5269,5347,forward,0.723076923076923,MAGRSGDSDEELLRIAGTIKFLYQSS,MAGRSGDSDEELLRIAGTIKFLYQSS -MN090376,vpu,5361,5631,forward,0.7073170731707319,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL* -MN090376,env,5524,8137,forward,0.5484813084112157,MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*NGRHILKT* -MN090376,tat_exon2,7691,7784,forward,0.4866666666666659,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT* -MN090376,rev_exon2,7692,7968,forward,0.46153846153846145,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE* -MN090376,nef,8111,8735,forward,0.6943089430894234,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC* -MK115581.1,gag,680,2186,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115581.1,pol,1972,4984,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115581.1,vif,4928,5507,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115581.1,vpr,5446,5740,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115581.1,tat_exon1,5717,5936,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ* -MK115581.1,rev_exon1,5856,5934,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS -MK115581.1,vpu,5948,6194,forward,0.6865853658536587,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115581.1,env,6111,8652,forward,0.49135514018691584,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115581.1,tat_exon2,8233,8329,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115581.1,rev_exon2,8234,8519,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115581.1,nef,8653,9274,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK115690.1,gag,777,2292,forward,0.1894,MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ*R* -MK115690.1,pol,2078,5090,forward,0.13958125623130613,FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115690.1,vif,5034,5622,forward,0.40104166666666674,MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH,MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH*SF* -MK115690.1,vpr,5552,5846,forward,0.5576923076923082,MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS,MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS*S -MK115690.1,tat_exon1,5823,6039,forward,0.45833333333333326,MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ,MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ -MK115690.1,rev_exon1,5962,6040,forward,0.6923076923076923,MAGRSGDNDEDLLKTVRFIKLLYQSS,MAGRSGDNDEDLLKTVRFIKLLYQSS -MK115690.1,vpu,6054,6300,forward,0.552439024390244,MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL,MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL* -MK115690.1,env,6217,8800,forward,0.5558411214953274,MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ,MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ* -MK115690.1,tat_exon2,8381,8489,forward,0.28666666666666596,RPTSQPRGDPTGPKEPETKVESKTETDPLT,RPTSQPRGDPTGPKEPETKVESKTETDPLT*WMDS* -MK115690.1,rev_exon2,8382,8658,forward,0.4505494505494505,DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE,DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE* -MK115690.1,nef,8801,9425,forward,0.6089430894308867,MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN,MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN*NC* -MK115571.1,gag,579,2079,forward,0.2571999999999999,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE* -MK115571.1,pol,1871,4883,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115571.1,vif,4827,5406,forward,0.36979166666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115571.1,vpr,5345,5639,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115571.1,tat_exon1,5616,5832,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ -MK115571.1,rev_exon1,5755,5833,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS -MK115571.1,vpu,5847,6093,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115571.1,env,6010,8551,forward,0.49065420560747675,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115571.1,tat_exon2,8132,8228,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115571.1,rev_exon2,8133,8418,forward,0.4285714285714286,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115571.1,nef,8552,9173,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK115514.1,gag,584,2090,forward,0.2571999999999999,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115514.1,pol,1876,4888,forward,0.14456630109670976,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115514.1,vif,4832,5411,forward,0.36979166666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115514.1,vpr,5350,5644,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115514.1,tat_exon1,5621,5840,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ* -MK115514.1,rev_exon1,5760,5838,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS -MK115514.1,vpu,5852,6098,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115514.1,env,6015,8556,forward,0.4941588785046729,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115514.1,tat_exon2,8137,8233,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115514.1,rev_exon2,8138,8423,forward,0.4285714285714286,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115514.1,nef,8557,9178,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK115488.1,gag,707,2213,forward,0.2571999999999999,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115488.1,pol,1999,5011,forward,0.14456630109670976,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115488.1,vif,4955,5534,forward,0.36979166666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115488.1,vpr,5473,5767,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115488.1,tat_exon1,5744,5963,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ* -MK115488.1,rev_exon1,5883,5961,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS -MK115488.1,vpu,5975,6221,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115488.1,env,6138,8679,forward,0.4941588785046729,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115488.1,tat_exon2,8260,8356,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115488.1,rev_exon2,8261,8546,forward,0.4285714285714286,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115488.1,nef,8680,9301,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK115030.1,gag,176,1685,forward,0.22580000000000022,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ* -MK115030.1,pol,1477,4567,forward,0.21934197407776668,FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*NMEQFSKTPYAYFKESSEMGLQTSL* -MK115030.1,vif,4433,5012,forward,0.38020833333333326,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH* -MK115030.1,vpr,4951,5245,forward,0.5192307692307698,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*L -MK115030.1,tat_exon1,5222,5441,forward,0.5972222222222223,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ* -MK115030.1,rev_exon1,5361,5439,forward,0.6538461538461537,MAGRSGDSDEELLTAVRIIKRLYQSS,MAGRSGDSDEELLTAVRIIKRLYQSS -MK115030.1,vpu,5453,5699,forward,0.780487804878049,MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM,MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM* -MK115030.1,env,5616,8217,forward,0.5768691588785053,MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL* -MK115030.1,tat_exon2,7798,7891,forward,0.4866666666666659,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD* -MK115030.1,rev_exon2,7799,8075,forward,0.4285714285714286,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE* -MK115030.1,nef,8218,8866,forward,0.7959349593495859,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*H* -MK115498.1,gag,663,2169,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115498.1,pol,1955,4967,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115498.1,vif,4911,5490,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115498.1,vpr,5429,5723,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115498.1,tat_exon1,5700,5916,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ -MK115498.1,rev_exon1,5839,5917,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS -MK115498.1,vpu,5931,6177,forward,0.6865853658536587,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115498.1,env,6094,8635,forward,0.49135514018691584,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115498.1,tat_exon2,8216,8312,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115498.1,rev_exon2,8217,8502,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115498.1,nef,8636,9257,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK115211.1,gag,250,1753,forward,0.1938000000000002,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP*SQ* -MK115211.1,pol,1545,4557,forward,0.20219341974077754,FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED* -MK115211.1,vif,4501,5083,forward,0.39687499999999987,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH* -MK115211.1,vpr,5022,5316,forward,0.4807692307692313,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*T -MK115211.1,tat_exon1,5293,5512,forward,0.5694444444444444,MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ* -MK115211.1,rev_exon1,5432,5513,forward,0.7115384615384615,MAGRSGDSDEELLRITRTIKFLYQNSE,MAGRSGDSDEELLRITRTIKFLYQNSE -MK115211.1,vpu,5524,5794,forward,0.7439024390243905,MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL,MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL* -MK115211.1,env,5687,8198,forward,1.2061915887850478,MHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGRSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDPEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTTINNTSSIEEGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSATITQACPKVSFEPIPIH*VQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRKAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL* -MK115211.1,tat_exon2,7779,7872,forward,0.4866666666666659,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT* -MK115211.1,rev_exon2,7780,8056,forward,0.46153846153846145,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE* -MK115211.1,nef,8199,8838,forward,0.6943089430894234,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC*QRAF* -MK115158.1,gag,316,1819,forward,0.3517171717171721,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP*SQ* -MK115158.1,pol,1611,4623,forward,0.26447105788423153,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED* -MK115158.1,vif,4567,5149,forward,0.5668393782383419,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH* -MK115158.1,vpr,5088,5379,forward,0.46875,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS* -MK115158.1,tat_exon1,5359,5578,forward,0.5416666666666667,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ* -MK115158.1,rev_exon1,5498,5579,forward,0.75,MAGRSGDSDEELLKITRTIKFLYQNSE,MAGRSGDSDEELLKITRTIKFLYQNSE -MK115158.1,vpu,5590,5860,forward,0.5308641975308646,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWDVNDL,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWDVNDL* -MK115158.1,env,5753,8342,forward,0.5740566037735857,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGMSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCENVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGMSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCENVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*NGRHILKT* -MK115158.1,tat_exon2,7896,7992,forward,0.6935483870967742,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*R -MK115158.1,rev_exon2,7897,8173,forward,0.5274725274725274,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGSGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGSGTSGTQGVGSPQVLVESPAVLEPGTKE* -MK115158.1,nef,8316,8994,forward,0.6674757281553398,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC*QRAFYKGLSARDFPGEA* -MK114705.1,gag,532,2053,forward,0.21479999999999988,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ*R* -MK114705.1,pol,1839,4851,forward,0.17248255234297116,FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK114705.1,vif,4795,5383,forward,0.34375,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH*NF* -MK114705.1,vpr,5313,5601,forward,0.46153846153846234,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS*T -MK114705.1,tat_exon1,5578,5797,forward,0.6222222222222225,MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ,MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ* -MK114705.1,rev_exon1,5717,5798,forward,0.8653846153846154,MAGRSGDRDEDLLETVRFIKFLYQNSK,MAGRSGDRDEDLLETVRFIKFLYQNSK -MK114705.1,vpu,5809,6055,forward,0.7963414634146342,MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL,MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL* -MK114705.1,env,5972,8549,forward,0.5660046728971964,MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL,MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL* -MK114705.1,tat_exon2,8130,8226,forward,0.9733333333333327,RPPAQPQGDPTGPKKSKKEVEKETETDQCD,RPPAQPQGDPTGPKKSKKEVEKETETDQCD** -MK114705.1,rev_exon2,8131,8407,forward,0.5494505494505495,DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE,DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE* -MK114705.1,nef,8550,9138,forward,0.4593495934959331,MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK,MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK*CVPVCCVTLVTRDPSDHFSQRGKSLAVAPEQGPESESRTRGDLSTQDSAC* -MK114856.1,gag,120,2022,forward,1.871000000000001,MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC,MLHISSCFLPVLGLSGWTRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSGSNLVQPERPSSSGARTGT*KRK*NQRRSLDAGLGLLKRARQEAKGGDW*VRHF*LAEARRRKIGARASVLSRGELDR*EKIQLRPRRKKKYRLKHIV*ASKELERFAVNPGLLETSGGCKQILEQLQPSLQTRSEELRSLYNTVATLYYVHQKIDVKDTKEALDKVEEEQNKSKKKAQQAAADTRNRGQTSQNFPIVQNLQGQIVHQAISPRTLNA*VKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVSRHQAAMQMLKKVINEEAAE*DRLHPVHARPIAPGQIREPKRSDIARTTSTLQEQIR*MTHNPPIPVRKIYKR*IILGLNKIVKMYSPTSILDIKQRPKEPFRDYVDQFYKTLRAKQATQKVKN*MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC*KYRKERHQMKNCTKRQANFLKKIWPSHKGRPENFPQSRPEIPQSRPEPTAPPAPPEKSFKFEEATTPSQKQETIDKELYPLTSLRSLFGNDPSSQ* -MK114856.1,pol,1787,4892,forward,2.003988035892324,ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI,FFKENLAFPQRKARELSSKPTRNSSEQTRANSPTSPSRKELQV*RSNNSLSEAGDNRQGAVSSNFPQITLWQRPIVTIKIREQLKKALLNTGADDTVLEDIDLPRK*KPKMIRRIRSFIKVRQYEQVPIEISRHKAISTVLVGPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPRMDGPKVKQ*PLTEEKIKALVEICTEIEKEKKISKIRPENPYNTPVFAIKKKDGTK*KKLVDFRELNKKTQDF*EIQLSIPHPAKLKKKKSVTVLDVGDAYFSVPLDKDFKKYTAFTIPSINNETPKIRYQYNVLPQR*KRSPAIFQSSMTKILEPFRKTNPDIVIYQYIDDLYVRSDLEIRQHRTKVKELRQHLMR*RFTTPDKKHQKEPPFL*MRYELHPDKWTVQPIVLPEKES*TVNDIQKLVRKLN*ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI*RRTPKFRLPIQKET*ET*WTDYWQAT*IPK*EFVNTPPLVKL*YQLEKEPIIRAETFYVDKAANKDNKSRKARYVTDRRRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKKKVYLA*VPAHKRIKRNEQVNKLVSARIKKVLFLDKIEKAQEDHKKYHSN*RTMASNFNLPPIVAKEIVASCDKCQLKKEAMHRQVDCSPGIWQLDCTHLEEKIILVAVHVASRYIEAEVIPAETRQETAYFILKLARRWPVKTIHTDNGRNFTSNTVKAAC**AKIKQEFSIPYNPQSQEVVKSINNELKKIIRQVKDQAKHLKTAVQMAVFIHNFKRKGGIEGYSAEERIVDIIATEIQTKELQKQITKIQNFQVYYKDSRDPL*KGPAKLLWKGEKAVVIQDNSDIKVVPRRKAKIIKDYKKQMASDDCVASRQDED*NMEKFSKIPYVYFKESQEIGL* -MK114856.1,vif,4791,5349,forward,1.928125,MIVWQVDRMKIRTWKSLVKYHMYISKKAKK,MIVWQVDRMKIRTWKSLVKYHMYISKKAKK*AYRHHYETTHPRISSEVHIPLGGARLVITTY*GLHTGEKDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVRSLQYLALTALITPKKIKPPLPSVKKLTEDR*NKPQKTKGHRKSHTMNRH* -MK114856.1,vpr,5033,5582,forward,2.052564102564103,MLFIHFRIKCHHSRIGIVLQRRARNRASRS,MEKKEI*HTSRP*LSRPSNSCALF*LFFRICYKKCHIRT*S*P*V*ISSRT*QSKISTILGTNSINNTKEDKATFA*CKETDRR*IEQAPEDQRPQKEPYNE*TLELLEELKREAVRHFPRPWLQNLRQYIYETYKDTWTRVEAIIRILQQMLFIHFRIKCHHSRIGIVLQRRARNRASRS*T -MK114856.1,tat_exon1,5427,5775,forward,2.1097222222222225,MKLIKILGQE,MKLIKILGQE*KP**EFCNKCCLFISELSVTIAE*ALFCKEEQEIEPVDHRLEP*KHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ -MK114856.1,rev_exon1,5698,5776,forward,0.6923076923076923,MAGRSGDRDEDLLKTVRLIKFLYQSS,MAGRSGDRDEDLLKTVRLIKFLYQSS -MK114856.1,vpu,5790,6039,forward,1.3926829268292686,TIVGIKYKKILRQRKIDRIINRIRKRAEDSGNESEKDQEELSALVVEIRHDAP,MQPLKILAIVALVVAAIIAIVV*TIVGIKYKKILRQRKIDRIINRIRKRAEDSGNESEKDQEELSALVVEIRHDAP*DVDDL* -MK114856.1,env,5953,8557,forward,1.8896028037383144,MTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD,MRAKKIRKNCQHL**K*GTMLLKMLMICSAAENL*VTVYYEVPV*RDANTTLFCASDAKAYDTEVHNV*ATHACVPTDPNPHEVELKNVTENFNM*KNNMVDQMHEDIINL*DQSLKPCAKLTPLCVTLNCTDLKNNTVGNQTNYHLNETNTIQRKEMTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD*SDTLSKIVEKLKEKFRKNKTIIFKQSSREDIEIETHSFNCREEFFYCNTTRLFNST*SVNRTSINRTNNKNITLPCRIKQIINRWQEVRKAMYAPPISKIIRCSSNITGLILTRDSSTTNSKEETFRPRERNMKDN*RSELYKYKVVKIEPLKVAPTKAQRKVVQREKRAIRTLGAMFLRFLRTAGSTIGAASLTLTVQARQLLSGIVQQQNNLLKAIEAQQHMLQLTV*GIKQLQARVLSVERYLQDQQLLKI*SCSRKLICTTTVP*NTS*SNKSYSTI*DNMT*MQ*DREIQNYTKIIYNLLKESQIQQKKNEKELLELDQ*ANL*N*FSITKWL*YIKIFIMIVGGLVSLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRRPDRPERIEEEGEKRDRGRSRRLVTRFLPLI*DDLQSLCLFSYHHLKDLLLIVLKTVQILGHKK*EILKY**SLLQY*IQELKNSAVSLLNTIAIAVAERTDKVIEVRQKISRAFLHIPRKIRQGLEKALQ*NKWQVVKKLYG* -MK114856.1,tat_exon2,8102,8198,forward,0.8,RPSSQPQEDQTGPKE,RPSSQPQEDQTGPKE*KKKVKRETEADPED** -MK114856.1,rev_exon2,8103,8379,forward,1.3725274725274725,ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE,DPPPNPKKTRQARKNRRRR*KERQRQIQKISD*ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE* -MK114856.1,nef,8549,9176,forward,2.0414634146341464,MSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MAR*PAVKERIERVNPRPAAKKEQAEPAAAKVRAASRDLEKYRAITSSNTSTTNAACA*LEAQEEEEVGFPVRPQVPLRPMTYKAALNLSHFLKEKGGLEGLI*SQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRNPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC* -MK115009.1,gag,302,1715,forward,1.8444000000000005,MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC,MGARASVLSGGKLDR*EKIYLRPEGKKKYRLKHIV*ASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQIVHQPLSPRTLNA*VKVIEEKAFSPEVIPMFSALSERATPQDLNTMLNTVRGHQAAMQMLKETINDEAAE*DRLHPVHAGPIAPGQMKEPRGSDIAGTTSTLQEQIR*MTHNPPIPVGEIYKRWIILRLNKIVRMYSPVSILDIRQRPKEPFKDYVDRFYKTLKAEQASQDVKN*MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC*KCRKERHQMKDCTKRPD*DG*FFKEDLAFPQGKAREFSPEQTRANSPASRELQV* -MK115009.1,pol,1613,4703,forward,1.89531405782652,AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED,FFKEDLAFPQGKAREFSPEQTRANSPASRELQV*GRGNSSSSEAGDERPRTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEINLPGK*KPKMIKRIRSFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKSGIDSPRVKQWPLTEEKIKALIEICAEIEKEKKITKIRPENPYNTPVFAIKKKDSTK*KKLVDFRELNKRTQDF*EVQLRIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPEVKYQYNVLPQR*KRSPAIFQSSMTKILEPFRKENPDIVIYQYIDDLYVRSDLEIEQHRTKIEELRQHLLR*GLTTPDKKHQKKPPFL*ISYELHPDK*TVQPIQLPDKDS*TVNDIQKLVRKLN*ASQIYPEIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQRRDQ*TYQIYQEPFKNLKTEKYARTRGAHTNDVKQLTEAVQKIALEAIVI*RKTPKFKLPIQKET*KMWWTKYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVRAETFYVNKAANRKTKLRKAEYVTDRRRQKVVSLIDTTNQRTKLHAIHLALQDSGSTVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKEKIYLA*VPAHKRIEGNEQVDKLVSNRIRRVLFLDRIDKAQEEHEKYHSN*RAMASNFNLPPVVAKEIVASCDKCQLKGEPMHRQVDCSPGIWQLDCTHLERKIILVAVHVASRYIEAEVIAAETGQETAYFILKLAGR*PVKIIHTDNGSNFTSTTVKAAC**AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED*NIEQFSKTPYAYFKESSEIGLQTSL* -MK115009.1,vif,4590,5148,forward,2.064583333333333,MIVWQVDRMRIRT,MIVWQVDRMRIRT*NSLVKHHMHISKKAQR*VYRHHYESHNPKTSSEVHIPLEEARLVIKTY*GLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKRSHTINGH* -MK115009.1,vpr,5087,5381,forward,1.0679487179487188,MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT,MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT*AEVEAIIRTLQQLLFIHFRIRCQHSRIGIIRQRRARNRASRS*L -MK115009.1,tat_exon1,5412,5574,forward,1.0958333333333334,MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ,MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ -MK115009.1,rev_exon1,5497,5575,forward,0.7692307692307692,MAGRSRDSDEELLTAVRIIKRLYQSS,MAGRSRDSDEELLTAVRIIKRLYQSS -MK115009.1,vpu,5589,5835,forward,0.9975609756097563,MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP,MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP*DSNDM* -MK115009.1,env,5752,8353,forward,1.878154205607472,MKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD,MRVTRTKRNYPHLWR*GILFLKIVMICSANNL*VTVYYKVPV*KEATTTLFCASDAKAYETEKHNV*ATHACVPTDPSPQEVALENVTETFNM*KNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDNLNLTCPNNNTCSNNTNYNMKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD*NDTLKQIVIKLKEKFKNKTIVFTQSSGEDPEIVMHSFNCREEFFYCNTTQLFNST*NNST*NSTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQRQIRCSSNITGLLLVRDGRSNNSSNDTETFRPRGRDMKDN*RSKLYKYKVVKIKPLRIAPTHAKRRVVQKEKRAIRLEAFFLRFLRAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQAKVLALERYLKDQQLLRI*SCSGKLICTTNVPWNISWSPRWNRSLDKI*TNMT*KQ*EKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQ*L*YIKIFIIIVRGLISLRIVFTILSIVNKVRQGYSPLSLQTLLPTQRGPDRPERTEERGRKKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLKDLLLIAARIVELLGRRK*EALKY**NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL* -MK115009.1,tat_exon2,7934,8027,forward,0.6866666666666661,RPSSQPREDPTGPKEQKKEVERKTEAHPRD,RPSSQPREDPTGPKEQKKEVERKTEAHPRD* -MK115009.1,rev_exon2,7935,8211,forward,1.3065934065934066,ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE,DPPPNPERTRQARKNRRKR*KERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE* -MK115009.1,nef,8609,8996,forward,1.6390243902439028,MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR,MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR*CFKLVPVDPDKVEEASVRENNCLLSPENLHRMEDEHREVLQWRFDSRLAFHHIARELHPEYYKDC* -MK115387.1,gag,292,1795,forward,0.20799999999999996,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ* -MK115387.1,pol,1587,4599,forward,0.13160518444665992,FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115387.1,vif,4543,5122,forward,0.3041666666666665,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH* -MK115387.1,vpr,5061,5355,forward,0.4038461538461544,MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS,MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*I -MK115387.1,tat_exon1,5332,5551,forward,0.41666666666666674,MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ,MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ* -MK115387.1,rev_exon1,5471,5552,forward,0.6346153846153846,MAGRSGDSDEDLLKTVRLIKYLYQSSE,MAGRSGDSDEDLLKTVRLIKYLYQSSE -MK115387.1,vpu,5563,5809,forward,0.7682926829268295,MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL,MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL* -MK115387.1,env,5726,8288,forward,0.6280373831775696,MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL,MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL* -MK115387.1,tat_exon2,7869,7965,forward,0.6000000000000001,RPSSQLRGEPTGPKE,RPSSQLRGEPTGPKE*KKEVERETKADPVD** -MK115387.1,rev_exon2,7870,8146,forward,0.29670329670329676,DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE,DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE* -MK115387.1,nef,8289,8940,forward,0.5162601626016183,MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC,MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC* -MK115491.1,gag,521,2027,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115491.1,pol,1813,4825,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115491.1,vif,4769,5348,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115491.1,vpr,5287,5581,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115491.1,tat_exon1,5558,5777,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ* -MK115491.1,rev_exon1,5697,5775,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS -MK115491.1,vpu,5789,6035,forward,0.6865853658536587,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115491.1,env,5952,8493,forward,0.49135514018691584,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115491.1,tat_exon2,8074,8170,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115491.1,rev_exon2,8075,8360,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115491.1,nef,8494,9115,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK116110.1,gag,0,1557,forward,2.1186000000000007,MVFISCGVAPSANAENIGITSGLKAFSSTTFTHAFKVLGDMA,PESESRTREVLSTQDSAC*ALWPGPPTP*HAVIISSSVAAGPNAFKIVLQSGFAFWTNKVSVIQFFTSCEACSALRVL*NRST*SLKGSFGPCFMSKMLTGLYILTILFNPRITHLL*ISPTGIGGLFVIHPICS*RVLVVPAISLPLGSLIWPGATGPACTGCNLSHSAASSLMVSFNICIAA*CPPTVFSMVFISCGVAPSANAENIGITSGLKAFSSTTFTHAFKVLGDMA*CTICPWRFCTIG*FWLTWLLFPAPAAACCAFILLLFCSSSILSSAPLVSCISIL*CIQ*RTATVLYNDLSSSDPVWRDGCSCPSICLQPSDVSNRPGLTANRSSSLLAHTRCFNLYFFFPPGLNRIFSHWSNFPPLNTDALAPISLLLASAR*KLFWRTHQSPKQ*AK*IQLP**CRKAILGTKRRLLSVSTVVK*GI*QKIAGPPGERAVGNVDRKDTR*KIVVRDRLIF*GNSGLPTRGGQGISFRADQSQQPHQRRASGLGKRQQLPLRSRSR*TGNYIP* -MK116110.1,pol,1393,4405,forward,0.19680957128614174,FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED,FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED* -MK116110.1,vif,4349,4928,forward,0.546875,MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH,MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH* -MK116110.1,vpr,4867,5158,forward,0.48333333333333317,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPRIWLQSLGQYVYETYGDTWTGVEAIIRILQQMLFIHFRIGCQHSRIGIIRRGRTRNGASRP,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPRIWLQSLGQYVYETYGDTWTGVEAIIRILQQMLFIHFRIGCQHSRIGIIRRGRTRNGASRP* -MK116110.1,tat_exon1,5138,5357,forward,0.6111111111111112,MEPVDPSLAPWKHPGSQPKTACTNCYCKKCCLHCQVCFTKKGLGISYGRKKRRQRRRPPQSSKAHQNPLPKQ,MEPVDPSLAPWKHPGSQPKTACTNCYCKKCCLHCQVCFTKKGLGISYGRKKRRQRRRPPQSSKAHQNPLPKQ* -MK116110.1,rev_exon1,5277,5355,forward,0.5769230769230769,MAGRSGDSDEDLLKAVRLIKILYQSS,MAGRSGDSDEDLLKAVRLIKILYQSS -MK116110.1,vpu,5369,5615,forward,0.48124999999999996,MQSLQIGAIVALVVGTIIAIVVWSIVLIEYRKILRQKKIDRIIDRIVERAEDSGNESEGDQEELSALVERGHDAPWNVNDL,MQSLQIGAIVALVVGTIIAIVVWSIVLIEYRKILRQKKIDRIIDRIVERAEDSGNESEGDQEELSALVERGHDAPWNVNDL* -MK116110.1,env,5532,8073,forward,0.5259128386336873,MRVKETRKSYQHWWKGGMMLLGMLMICSAATNLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVLLGNVTEDFNAWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILHCTDVNNTRNGMTGELKNCSFNITTKITNKVQKEYALFYKLDVVPINNKDNDTSFNNNSYRLISCNTSVITQACPKVSFEPIPIHYCTPAGYAILRCNNETFSGKGPCTNVSSIQCTHGIRPVVSTQLLLNGSLAKQEVVIRSQNFSDNVKTIIVQLKTPVKINCTRPNNNTRKSIHAGPGKVIYATGEIIGDIRQAHCNISAAEWNDTLGQIVTKLQEQFGNKTIVFNQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWNNNGTNTWNSTGNITLPCKIRQIVNMWQKVGKAMYAPPIRGQIKCSSNITGLLLTRDGGNESESETFRPGGGDMRDNWRSELYKYKVVRIEPLGLAPTKAKRRVVQREKRAIGTLGAVFLGFLGTAGSTMGAASMTLTVQARQLLSGIVQQQNNLLKAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNASWSNKSLNEIWDNMTWMEWEKEISNYTQLIYTLIEESQSQQEKNEQELLALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEDGGERDRDRSTRLVTGFLPLFWDDLRSLCLFSYHRLRDLLLIAARIVELLGHRGWEILKHWWSLLQYWSQELKKSAVSLLNATAIAVAEGTDRIIEVVQRACRAILHIPVRLRQGLERALL,MRVKETRKSYQHWWKGGMMLLGMLMICSAATNLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVLLGNVTEDFNAWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILHCTDVNNTRNGMTGELKNCSFNITTKITNKVQKEYALFYKLDVVPINNKDNDTSFNNNSYRLISCNTSVITQACPKVSFEPIPIHYCTPAGYAILRCNNETFSGKGPCTNVSSIQCTHGIRPVVSTQLLLNGSLAKQEVVIRSQNFSDNVKTIIVQLKTPVKINCTRPNNNTRKSIHAGPGKVIYATGEIIGDIRQAHCNISAAEWNDTLGQIVTKLQEQFGNKTIVFNQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWNNNGTNTWNSTGNITLPCKIRQIVNMWQKVGKAMYAPPIRGQIKCSSNITGLLLTRDGGNESESETFRPGGGDMRDNWRSELYKYKVVRIEPLGLAPTKAKRRVVQREKRAIGTLGAVFLGFLGTAGSTMGAASMTLTVQARQLLSGIVQQQNNLLKAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNASWSNKSLNEIWDNMTWMEWEKEISNYTQLIYTLIEESQSQQEKNEQELLALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEDGGERDRDRSTRLVTGFLPLFWDDLRSLCLFSYHRLRDLLLIAARIVELLGHRGWEILKHWWSLLQYWSQELKKSAVSLLNATAIAVAEGTDRIIEVVQRACRAILHIPVRLRQGLERALL* -MK116110.1,tat_exon2,7654,7750,forward,0.5,RPASQPRGDPTGPKESKKTVERETETDPHA,RPASQPRGDPTGPKESKKTVERETETDPHA** -MK116110.1,rev_exon2,7655,7940,forward,0.48241758241758226,DPLPSPEGTRQARRNRRRRWRERQRQIHTLSNRILTTFLGRPEEPVPLQLPPLERLTLDCSEDCGTSGTQGVGNPQTLVESPTILESGTKKKCC,DPLPSPEGTRQARRNRRRRWRERQRQIHTLSNRILTTFLGRPEEPVPLQLPPLERLTLDCSEDCGTSGTQGVGNPQTLVESPTILESGTKKKCC* -MK116110.1,nef,8074,8695,forward,0.4668269230769231,MGGKWSKSSVVGWPAVRERIRRAGPAAEGVGAVSRDLDKHGAITSNNTPATNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGMIYSQQRQDILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPLETEQVEAATGGENNCLLHPLNQHGMDDPEREVLMWKFDSSLAFHHRAKELHPEYYKDC,MGGKWSKSSVVGWPAVRERIRRAGPAAEGVGAVSRDLDKHGAITSNNTPATNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGMIYSQQRQDILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPLETEQVEAATGGENNCLLHPLNQHGMDDPEREVLMWKFDSSLAFHHRAKELHPEYYKDC* -MK115527.1,gag,683,2189,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115527.1,pol,1975,4987,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115527.1,vif,4931,5510,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115527.1,vpr,5449,5743,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115527.1,tat_exon1,5720,5939,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ* -MK115527.1,rev_exon1,5859,5937,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS -MK115527.1,vpu,5951,6197,forward,0.6865853658536587,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115527.1,env,6114,8655,forward,0.49135514018691584,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115527.1,tat_exon2,8236,8332,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115527.1,rev_exon2,8237,8522,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115527.1,nef,8656,9277,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK114997.1,gag,210,1725,forward,0.22980000000000023,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP*YQ*E* -MK114997.1,pol,1511,4601,forward,0.21934197407776668,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*NMEQFSKTPYAYFKESSEMGLQTSL* -MK114997.1,vif,4467,5046,forward,0.38020833333333326,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH* -MK114997.1,vpr,4985,5279,forward,0.44230769230769296,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*L -MK114997.1,tat_exon1,5256,5472,forward,0.5694444444444444,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ -MK114997.1,rev_exon1,5395,5473,forward,0.6538461538461537,MAGRSGDSDEELLTAVRIIKRLYQSS,MAGRSGDSDEELLTAVRIIKRLYQSS -MK114997.1,vpu,5487,5733,forward,0.751219512195122,MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM,MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM* -MK114997.1,env,5762,8216,forward,1.2265186915887858,MHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MGYLYGKKQLPLYFVHQMLKHMRQRSIMFGQPMPVYPQTPAHRK*H*KM*QKHLTCGKMTW*SRCMRI*SVYGIKA*SHV*N*PHSVLL*IALIV*VIILIII*RKKEK*KTALSMSPQE*EIG*QKNMHFSIDLM*YQ*MKIVEILRANIG**IVTPQSLHKPVQRYPLSQFPYIFVPRLVLRF*SVEIRNSMEQENVEMSAQYNVHMELGQ*YQLNCC*TAV*QKKR**LDLPISRTMLKP**YS*INL*KLIVQDPTIIQEEVYT*DQGEHFMEQT**GI*DKRIVTLVGKIGMTL*KKIVIKLKEKFENKTIVFNQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*DG* -MK114997.1,tat_exon2,7788,7881,forward,0.4866666666666659,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD* -MK114997.1,rev_exon2,7789,8065,forward,0.4285714285714286,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE* -MK114997.1,nef,8208,8856,forward,0.7959349593495859,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC*H* -MK115518.1,gag,739,2245,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115518.1,pol,2031,5043,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115518.1,vif,4987,5566,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115518.1,vpr,5505,5799,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115518.1,tat_exon1,5776,5995,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ* -MK115518.1,rev_exon1,5915,5996,forward,0.6346153846153846,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK -MK115518.1,vpu,6007,6253,forward,0.6865853658536587,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115518.1,env,6170,8711,forward,0.49018691588785046,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115518.1,tat_exon2,8292,8388,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115518.1,rev_exon2,8293,8578,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115518.1,nef,8712,9333,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK115065.1,gag,221,1736,forward,0.24380000000000024,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*K* -MK115065.1,pol,1522,4534,forward,0.20438683948155534,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED* -MK115065.1,vif,4478,5057,forward,0.38020833333333326,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH* -MK115065.1,vpr,4996,5290,forward,0.4807692307692313,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*L -MK115065.1,tat_exon1,5267,5486,forward,0.5972222222222223,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ* -MK115065.1,rev_exon1,5406,5484,forward,0.6538461538461537,MAGRSGDSDEELLTAVRIIKRLYQSS,MAGRSGDSDEELLTAVRIIKRLYQSS -MK115065.1,vpu,5498,5744,forward,0.751219512195122,MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM,MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM* -MK115065.1,env,5661,8262,forward,0.5663551401869167,MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL* -MK115065.1,tat_exon2,7843,7936,forward,0.4866666666666659,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD* -MK115065.1,rev_exon2,7844,8120,forward,0.4285714285714286,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE* -MK115065.1,nef,8263,8911,forward,0.7471544715447078,MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*H* -MK115464.1,gag,527,2297,forward,1.495,MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ,MLQAIPGLRVGPAGSHPFALTSLSASCCHQSQSPGCSGATARTGT*KRK*NQRSSLDAGLGLLKRARQEARGGDW*VRQF*LAEARRREISARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADKGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNA*VKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAE*DRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIA*MTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKN*MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ* -MK115464.1,pol,2089,5101,forward,1.8783649052841465,AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED,FFKEDLAFLQRKAKELSSEQTRANSPTRRELQV*GGDSNSSSEAGAGGQRSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEISLPGR*KPKMIEGIGGFIKVRQYDQITIEICGHKAIGTVLVGPTPVNIIGRNLLTQISCTLNFPISPIETVPVQLKPGIDSPKVKQWPLTEEKIKALVEICTEMEKEKKISKIRPENPYNTPVFAIKKKDSTK*RKLVDFKELNKRTQDF*EVQLRIPHPARLKKKKSITVLDVGDAYFSIPLDKDFKKYTAFTIPSINNKTPEIRYQYNVLPQG*KRSPAIFQSSMIKILEPFRKQNPDIVIYQYIDDLYVRSDLEIRQHRTKIEELRQHLLK*RLTTPDKKHQKEPPFLWISYELHPDKWTVQPIVLPDKDSWTVNDIQKLVRKLN*ASQIYAEIKVRQLCKLLKGAKALTEVIQLTEEAELELAENKEILKEPVHEVYYDPSKDLIAELQKQRQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVI*GKTPRFKLPIQKET*DT*WTEYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVGAETFYVDRAANKETKLRKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALRIIQAQPDKSESEIVNQIIEQLIKKEKVYLA*VPAHKRIRRNEQVDKLVSARIRKVLFLDRIDKAQEEHKKYHNN*RAMASDFNLPPVVAKKIVASCDKCQLKKEATHRQVDCSPRIWQLDCTHLEGKVILVAVHVASRYIEAEVIPAETGQETAYFLLKLAGR*PVKAIHTDNGTNFTSATVKAAC**AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED* -MK115464.1,vif,5045,5624,forward,1.494270833333335,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY*GLHTGERDWHLGQGVSIEWKERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRRSQTMNGH* -MK115464.1,vpr,5563,5857,forward,0.5192307692307698,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS*I -MK115464.1,tat_exon1,5711,6053,forward,2.118055555555556,MRILGQE,MRILGQE*EP**EFCNNCCLFISELGANIAE*ASLDRGEQEIEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ* -MK115464.1,rev_exon1,5973,6051,forward,0.5769230769230769,MAGRSGDSDEDLLKTVRLIKYLYQSS,MAGRSGDSDEDLLKTVRLIKYLYQSS -MK115464.1,vpu,6065,6347,forward,1.3170731707317076,AIVLIEYKKILKQRRIDRLIDRIIDKAEDSGNESEGDQEELSAFVEIGHHAP,MQSLYILTIVALVVAAILAIVV*AIVLIEYKKILKQRRIDRLIDRIIDKAEDSGNESEGDQEELSAFVEIGHHAP*NVDDL*YCRPVVGHSLL* -MK115464.1,env,6228,8826,forward,1.8288551401869095,MTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST,MRVKEIKRSYQHL*R*GIMLLRMLMIYSTADQWWVTVYYKVPVWREANTTLFCASDAKAYSTEAHNV*ATHACVPTDPNPQEIVIENVTEDFNMWKNNMVDQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTSNTT*GEMTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST*TKNGTDSWQSNDTQNSNITLQCRIKQIINLWQEVRKAMYAPPISRQINCTSNITGLVLTRDRRNETKTFRPGRENMKDNWRSKLYKYKVVRIEPLRIAPTKAKRRVVQREKRAVRLGAMFLKFLGAARSTIGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLAVERYLQDQQLLGL*GCSRKLICTTTVP*NRS*GRHNKNYKSLDDI*DNMT*IE*EKEIDNYTSLIYTLITESHSQQKKNEQELLALDK*ASL*N*FDISQWLWYIKIFIMIVGGLVSLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPERIEERGRERDKGRSGRLVNGFLALI*DDLRSLCLFSYHRLSDLLLIVIKIVELLRRKR*EALKY**NLLQY*SQELKNSAVSLLNTTAIVVAERTDKIIEILQRISRAFLHIPRRIRQGLEKALL*DRWQVVKK* -MK115464.1,tat_exon2,8380,8476,forward,0.6000000000000001,RPSSQPREEPTGPKE,RPSSQPREEPTGPKE*KKEVERETKADPVD** -MK115464.1,rev_exon2,8381,8657,forward,0.8274725274725274,RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE,DPPPSPERSRQARKNRRKR*RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE* -MK115464.1,nef,9064,9496,forward,1.64878048780488,MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC,MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*HRAFHQGLSRRGVA* -MK115530.1,gag,746,2252,forward,0.2571999999999999,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115530.1,pol,2038,5050,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115530.1,vif,4994,5573,forward,0.36979166666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115530.1,vpr,5512,5806,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115530.1,tat_exon1,5783,6002,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ* -MK115530.1,rev_exon1,5922,6000,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS -MK115530.1,vpu,6014,6260,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115530.1,env,6177,8718,forward,0.4941588785046729,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115530.1,tat_exon2,8299,8395,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115530.1,rev_exon2,8300,8585,forward,0.4285714285714286,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115530.1,nef,8719,9340,forward,0.5918699186991796,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK115520.1,gag,695,2195,forward,0.2571999999999999,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE* -MK115520.1,pol,1987,4915,forward,1.3952143569292395,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDMGNGQYSL,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDMGNGQYSL*YCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QR*YH*QKKQS*NWQKTGKF*ENQYMECIMTHQKT**QKYRSRAMDSGHIKFIKSHLKI*KQENMQE*GVPTLMM*NN*QRQYKR*PQKA**YGEKLLNLDYLYKKKHGRHGGQSTGKPPGFLSGSLSIPLP**NYGTN*RKNP**EQKLSM*MGQLIEKLN*AKQDMSLTEEDKRLSP*RTQQIKRLSYKQFI*LCRIRDQK*T**QTHNIH*ESFKHNQIRVNQS*SIR**SS**KRKKSTWHGYQHTKELEEMNK*TN*SVLESGEYYF*ME*IRPKKTMRNITVIGEQWLVILIYPL**QKK**PAVINVSKKERPCMDK*IVVQEYGN*IVHI*KGKLSW*QFM*PVDI*KQKLFQQRQGRKQHTFS*N*QGDGQ*KQYIQTMAAISPVMWLRPPVGGQGSSRNLAFPTIPKVKE**NP*IKN*RKL*DR*EIRLNILRQQYKWQYSSTILKEKGGLGGIVQGKE**I**QQTYKLKNYRNKLQKFKIFGFITGTAEIHFGKDQQSFSGKVKGQ**YKIIVI*K* -MK115520.1,vif,4948,5527,forward,0.36979166666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115520.1,vpr,5466,5760,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115520.1,tat_exon1,5737,5956,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ* -MK115520.1,rev_exon1,5876,5957,forward,0.6346153846153846,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK -MK115520.1,vpu,5968,6214,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115520.1,env,6131,8672,forward,0.49065420560747675,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115520.1,tat_exon2,8253,8349,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115520.1,rev_exon2,8254,8539,forward,0.4285714285714286,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115520.1,nef,8673,9294,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK115503.1,gag,817,2323,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115503.1,pol,2109,5121,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115503.1,vif,5065,5644,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115503.1,vpr,5583,5877,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115503.1,tat_exon1,5854,6073,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ* -MK115503.1,rev_exon1,5993,6074,forward,0.6346153846153846,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK -MK115503.1,vpu,6085,6331,forward,0.6865853658536587,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115503.1,env,6248,8789,forward,0.49135514018691584,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115503.1,tat_exon2,8370,8466,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115503.1,rev_exon2,8371,8656,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115503.1,nef,8790,9411,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK115570.1,gag,687,2193,forward,0.25119999999999987,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115570.1,pol,1979,4991,forward,0.14456630109670976,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115570.1,vif,4935,5514,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115570.1,vpr,5453,5747,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115570.1,tat_exon1,5724,5940,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ -MK115570.1,rev_exon1,5863,5941,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS -MK115570.1,vpu,5955,6201,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115570.1,env,6118,8659,forward,0.49649532710280364,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115570.1,tat_exon2,8240,8336,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115570.1,rev_exon2,8241,8526,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115570.1,nef,8660,9281,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK115509.1,gag,555,2061,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115509.1,pol,1847,4859,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115509.1,vif,4803,5382,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115509.1,vpr,5321,5615,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115509.1,tat_exon1,5592,5808,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ -MK115509.1,rev_exon1,5731,5809,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS -MK115509.1,vpu,5823,6069,forward,0.6865853658536587,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115509.1,env,5986,8527,forward,0.49135514018691584,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115509.1,tat_exon2,8108,8204,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115509.1,rev_exon2,8109,8394,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115509.1,nef,8528,9149,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK115702.1,gag,246,1782,forward,0.2866000000000015,MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ,MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ*SQ* -MK115702.1,pol,1544,4586,forward,0.18175473579262214,FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115702.1,vif,4530,5109,forward,0.34375,MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH* -MK115702.1,vpr,5048,5342,forward,0.44230769230769296,MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS,MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS*P -MK115702.1,tat_exon1,5319,5535,forward,0.6319444444444446,MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ,MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ -MK115702.1,rev_exon1,5458,5536,forward,0.8076923076923077,MAGRSGDGDEDLLKAVRLIKTLYQSS,MAGRSGDGDEDLLKAVRLIKTLYQSS -MK115702.1,vpu,5550,5808,forward,0.807317073170732,MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND,MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND** -MK115702.1,env,5716,8257,forward,0.6026869158878512,MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE,MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE*DRA* -MK115702.1,tat_exon2,7874,7970,forward,0.6866666666666661,RPASQSRGDPTGPKEPKKKVERETETDPTD,RPASQSRGDPTGPKEPKKKVERETETDPTD** -MK115702.1,rev_exon2,7875,8160,forward,0.3296703296703296,DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE*CC* -MK115702.1,nef,8275,8896,forward,0.658536585365846,MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC,MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC* -MK115095.1,gag,2,1697,forward,1.8384000000000005,MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC,SGFSFTFKSLFGRHLGDLKAKEKPEELSRRRTRLAERARQEARRGD**VRRNF*LAEARRREIGARASVLSGGELDR*EKIYLRPGRKKKYRLKHIVWASRELERFAVNPGLLKSSEGCRQILGQLQPALQTGSEELRSLYNTIAVLYCVHQKINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQIVHQPISPRTLNA*VKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVRRHQAAMQMLKETINDEAAE*DRLHPVHAGPIAPGQMKEPRRSDIAGTTSTLQEQIR*MTNNPPIPVGEIYKR*IILRLNKIVKMYSPVSILDIRQRPKEPFKDYVDRFYKTLKAEQASQDVKN*MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC*KCGKKGHQMKDCTKRQANFLRKIWPSHKGRPKNFLQSRPEPTAPPAESFRFKEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ* -MK115095.1,pol,1489,4579,forward,1.9898305084745753,KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK,FFKEDLAFPQGKAKEFSPEQTRANSPASRELQV*GRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIRRQLKEALLDTGADDTVLKEINLPGK*KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK*RKLVDFRELNKRTQDF*KVQLRIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPRVRYQYNVLPQR*KGSPAIFQSSMTKILEPFRKENPDIVIYQYIDDLYVRSDLEIEQHRTKIEELRQHLLK*RLTTPDKKHQKEPPFL*ISYELHPNKWTVQPIQLPDKDS*TVNDIQKLVRKLN*ASQIYPEIKVKQLCKLLRRTKALTEVVPLTEEAELELAENKEILKEPVHRAYYDPSKDLIAEVQKQGGDQWTYQIYQKPFKNLKTKKYARTRGAHTNDVKQLTEAVQKIALEAIVI*RKTPKFKLPIQKET*EM**TEYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVRAETFYVDRAANRETKLRKARYVTDRRRQKVVSLIDTTNQRTKLHAIHLALQDSGSTVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKEKIYLA*VPAHKRIRRNEQVDKLVSSRIRKVLFLDRIDKAQEEHEKYHSN*RAMASDFNLPPVVAKEIVASCDKCQLKREPMHGQVDCSPGIWQLDCTHLERKIILVAVHVASRYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAAC**ARIKQKFSIPYNPQSQGVVESMNNELKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKRGIGGYSAEERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLL*KGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*NMEQFSKTPYAYFKESSEMSLQTSP* -MK115095.1,vif,4445,5024,forward,1.8546875000000016,MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR,MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR*VYRHHHESHNPKTSSEVHIPLREARLVIKTY*GLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVRPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKRSHTMNGH* -MK115095.1,vpr,4963,5257,forward,0.5961538461538467,MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS,MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS*L -MK115095.1,tat_exon1,5288,5453,forward,1.1236111111111113,MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ,MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ* -MK115095.1,rev_exon1,5373,5451,forward,0.6538461538461537,MAGRSGDSDEELLTAVRIIKRLYQSS,MAGRSGDSDEELLTAVRIIKRLYQSS -MK115095.1,vpu,5465,5711,forward,1.3548780487804881,SIVLIEYKKILRQKKIDRLIDRIRERAEDSGNESDEDQEELSAIVEIGHLVP,MHALEIAAIVRLVVAAIIAIVV*SIVLIEYKKILRQKKIDRLIDRIRERAEDSGNESDEDQEELSAIVEIGHLVP*DSDDM* -MK115095.1,env,5628,8229,forward,1.8721962616822374,MTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD,MKVTRTRKNYQQL*R*GILFLRIVMICSANNL*VTVYYEVPVWKEATTTLFCASDAKAYKTEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDELNLNCPNNNTCSNNTKYNMTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD*NDTLKQIVIKLKEKFKNKTIVFNQSSGKDPEIVMHSFNCREEFFYCNTTQLFNST*NNNT*NGTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQGQIRCSSNITGLLLVRDSKSNNSSNDTKTFRPRRGDMKDN*RSELYKYKVVKIEPLRIAPTHAKRRVVQKEKRAIGLRAFFLKFLGAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLALERYLKDQQLLKI*GCSRKLICTTNVP*NVS*SPR*NRSLDKI*TNMT*KQ*EKEIDNYTDTIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQWL*YIKIFIMIVRGLISLRIVFTILSIVNRVRQRYSPLSLQTLLPTQRGPDRPERTEEGGREKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLRDLLLIVARIVELLRRRK*EALKYW*NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL* -MK115095.1,tat_exon2,7810,7903,forward,0.4866666666666659,RPSSQPRGDPTGPKEQKKEVERKTEAHPRD,RPSSQPRGDPTGPKEQKKEVERKTEAHPRD* -MK115095.1,rev_exon2,7811,8087,forward,1.2406593406593407,ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE,DPPPNPEGTRQARKNRRRR*RERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE* -MK115095.1,nef,8287,8878,forward,0.9788617886178801,MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*H* -MK115490.1,gag,549,2055,forward,0.2571999999999999,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115490.1,pol,1841,4853,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115490.1,vif,4797,5376,forward,0.36979166666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115490.1,vpr,5315,5609,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115490.1,tat_exon1,5586,5802,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ -MK115490.1,rev_exon1,5725,5803,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS -MK115490.1,vpu,5817,6063,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115490.1,env,5980,8521,forward,0.4941588785046729,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115490.1,tat_exon2,8102,8198,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115490.1,rev_exon2,8103,8388,forward,0.4285714285714286,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115490.1,nef,8522,9143,forward,0.5918699186991796,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -MK115576.1,gag,468,1974,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R* -MK115576.1,pol,1760,4772,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MK115576.1,vif,4716,5295,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH* -MK115576.1,vpr,5234,5528,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T -MK115576.1,tat_exon1,5505,5721,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ -MK115576.1,rev_exon1,5644,5722,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS -MK115576.1,vpu,5736,5982,forward,0.6865853658536587,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL* -MK115576.1,env,5899,8440,forward,0.49018691588785046,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL* -MK115576.1,tat_exon2,8021,8117,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD** -MK115576.1,rev_exon2,8022,8307,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY* -MK115576.1,nef,8441,9062,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H* -OQ092466,gag,825,2361,forward,0.16679999999999984,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ* -OQ092466,pol,2147,5165,forward,0.14356929212362912,FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -OQ092466,vif,5109,5688,forward,0.203125,MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH* -OQ092466,vpr,5627,5921,forward,0.3653846153846132,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*A -OQ092466,tat_exon1,5898,6114,forward,0.45833333333333326,MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ,MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ -OQ092466,rev_exon1,6037,6115,forward,0.5769230769230769,MAGRSGDSDDELLKTVRLIKVLYQSS,MAGRSGDSDDELLKTVRLIKVLYQSS -OQ092466,vpu,6129,6375,forward,0.6097560975609757,MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL,MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL* -OQ092466,env,6292,8902,forward,0.5255841121495328,MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL,MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL*DGWQMVKK* -OQ092466,tat_exon2,8456,8552,forward,0.886666666666666,RSTPQLRGDPTGPKESKEKVERETETDPVH,RSTPQLRGDPTGPKESKEKVERETETDPVH** -OQ092466,rev_exon2,8457,8733,forward,0.3626373626373627,DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE,DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE* -OQ092466,nef,8876,9509,forward,0.5040650406503988,MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC,MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC* -OQ092463,gag,801,2313,forward,0.20240000000000014,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ* -OQ092463,pol,2105,5117,forward,0.10767696909272173,FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -OQ092463,vif,5061,5640,forward,0.296875,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH* -OQ092463,vpr,5579,5870,forward,0.30208333333333326,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAITRILQQLLFIHFRIGCQHSRIGIIQRRRARNGTSRS,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAITRILQQLLFIHFRIGCQHSRIGIIQRRRARNGTSRS* -OQ092463,tat_exon1,5850,6066,forward,0.38888888888888884,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ -OQ092463,rev_exon1,5989,6067,forward,0.34615384615384626,MAGRSGDSDEELIKTVRLIKLLYQSS,MAGRSGDSDEELIKTVRLIKLLYQSS -OQ092463,vpu,6081,6330,forward,0.44999999999999996,MQPLEISAIVALVVAIIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL,MQPLEISAIVALVVAIIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL* -OQ092463,env,6244,8827,forward,0.44534746760895216,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFYASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNTTSTKNTTPSTTASSGERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKKFNGSGPCTNVSTIQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKTIIVHLKDSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSSWKDESNGTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLITRDGGKNNESNTTEIFRPEGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKTLEQIWDNMTWMQWEREIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHPPAPRGPDRPEGIGEEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLNIPRRIRQGLERALL,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFYASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNTTSTKNTTPSTTASSGERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKKFNGSGPCTNVSTIQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKTIIVHLKDSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSSWKDESNGTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLITRDGGKNNESNTTEIFRPEGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKTLEQIWDNMTWMQWEREIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHPPAPRGPDRPEGIGEEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLNIPRRIRQGLERALL* -OQ092463,tat_exon2,8408,8504,forward,0.6000000000000001,RPTPQPRGDPTGQKESEKKVERETETDPDH,RPTPQPRGDPTGQKESEKKVERETETDPDH** -OQ092463,rev_exon2,8409,8685,forward,0.3296703296703296,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE* -OQ092463,nef,8828,9461,forward,0.29182692307692304,MGGKWSKSSVVGWPAIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC,MGGKWSKSSVVGWPAIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC* -OQ092465,gag,855,2364,forward,0.3737903225806454,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQQIDVKDTKEALDKIEEEQNKSKKKVQQAATDTGNNSQASQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGAIMMQRGNFRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEETTTPSQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQQIDVKDTKEALDKIEEEQNKSKKKVQQAATDTGNNSQASQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGAIMMQRGNFRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEETTTPSQKQEPIDKELYPLASLRSLFGNDPSSQ*R* -OQ092465,pol,2150,5162,forward,0.1734795613160518,FFREDLAFPQGEAREFSSEQTRANSPTSRELQVRGGDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCRLLKGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTSRELQVRGGDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCRLLKGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -OQ092465,vif,5106,5685,forward,0.33854166666666674,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWIYKHHYDSINPKISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADRLIHLYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALTALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWIYKHHYDSINPKISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADRLIHLYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALTALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH* -OQ092465,vpr,5624,5915,forward,0.17708333333333326,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGILQRRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGILQRRRARNGASRS* -OQ092465,tat_exon1,5895,6111,forward,0.25,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ -OQ092465,rev_exon1,6034,6112,forward,0.5769230769230769,MAGRSGDSDEELIKTVRLIKLLYQSS,MAGRSGDSDEELIKTVRLIKLLYQSS -OQ092465,vpu,6126,6375,forward,0.3063291139240505,MQPLVISAIVALVVVAIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL,MQPLVISAIVALVVVAIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL* -OQ092465,env,6289,8881,forward,0.5249417249417256,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTGANNTTSTNTTTPSTTVSSEERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNTSYRLISCNTSVITQACPKVTFEPIPIHYCAPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKNIIVHLNKSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLEQVFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSYWKGEGSNNDTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLLTRDGGNESETTDTETFRPVGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKNLTQIWDNMTWMQWEKEIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTGANNTTSTNTTTPSTTVSSEERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNTSYRLISCNTSVITQACPKVTFEPIPIHYCAPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKNIIVHLNKSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLEQVFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSYWKGEGSNNDTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLLTRDGGNESETTDTETFRPVGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKNLTQIWDNMTWMQWEKEIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL* -OQ092465,tat_exon2,8462,8558,forward,3.5,RPTSQPRGDPTGQKESKEKVERETETDPDH,RPTSQPRGDPTGQKESKEKVERETETDPDH** -OQ092465,rev_exon2,8463,8739,forward,0.41758241758241765,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE* -OQ092465,nef,8882,9515,forward,0.3285714285714285,MGGKWSKSSVVGWPKIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC,MGGKWSKSSVVGWPKIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC* -OQ092462,gag,767,2270,forward,0.27679999999999993,MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ* -OQ092462,pol,2062,5074,forward,0.1495513459621136,FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -OQ092462,vif,5018,5597,forward,0.34375,MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH* -OQ092462,vpr,5536,5830,forward,0.32692307692307465,MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS,MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS*P -OQ092462,tat_exon1,5807,6026,forward,0.41666666666666674,MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ,MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ* -OQ092462,rev_exon1,5946,6024,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKFLYQSS,MAGRSGDSDEELLKAVRLIKFLYQSS -OQ092462,vpu,6038,6284,forward,0.7073170731707319,MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL,MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL* -OQ092462,env,6201,8844,forward,0.5698598130841122,MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL,MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL*DGWQGVKNEGMGCCKGKNEAN* -OQ092462,tat_exon2,8359,8455,forward,0.4866666666666659,RPASQPRGDPTGPKEPTKKVERETETDPDH,RPASQPRGDPTGPKEPTKKVERETETDPDH** -OQ092462,rev_exon2,8360,8636,forward,0.39560439560439553,DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE,DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE* -OQ092462,nef,8779,9406,forward,0.7422764227642202,MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC,MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC* -OQ092464,gag,773,2282,forward,0.38588709677419364,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ*R* -OQ092464,pol,2068,5080,forward,0.1734795613160518,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -OQ092464,vif,5024,5603,forward,0.29166666666666674,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH* -OQ092464,vpr,5542,5833,forward,0.20833333333333326,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGIIQRRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGIIQRRRARNGASRS* -OQ092464,tat_exon1,5813,6032,forward,0.25,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAPPDSQTHQASLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAPPDSQTHQASLSKQ* -OQ092464,rev_exon1,5952,6030,forward,0.5769230769230769,MAGRSGDSDEELLQTVRLIKLLYQSS,MAGRSGDSDEELLQTVRLIKLLYQSS -OQ092464,vpu,6044,6290,forward,0.4265822784810127,MQPLHIAAIVALVVAIIIAIVVWSIVFIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVEMGHCAPWDVNDL,MQPLHIAAIVALVVAIIIAIVVWSIVFIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVEMGHCAPWDVNDL* -OQ092464,env,6207,8790,forward,0.5058275058275068,MRVRGIKKNYQHLWRWGIVLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNNTTSTNDTTSTTTSSGEKMKEGEIKNCSFNITTSIRDKVQKEYALFYKPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGSCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSENFSDNAKTIIVHLNESVEITCIRPNNNTRKSIPIGPGRAFYATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNKTIIFTHSSGGDPEVVTHNFNCGGEFFYCNTTKLFNSTWNETSYWKDERSNDNDTITLPCRIKQIINLWQEVGKAMYAPPIRGYIKCSSNITGLLITRDGGKNESNTTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWDNMTWMEWEREIDNYTSLIYTLIEKSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSGPLVNGFLTIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL,MRVRGIKKNYQHLWRWGIVLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNNTTSTNDTTSTTTSSGEKMKEGEIKNCSFNITTSIRDKVQKEYALFYKPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGSCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSENFSDNAKTIIVHLNESVEITCIRPNNNTRKSIPIGPGRAFYATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNKTIIFTHSSGGDPEVVTHNFNCGGEFFYCNTTKLFNSTWNETSYWKDERSNDNDTITLPCRIKQIINLWQEVGKAMYAPPIRGYIKCSSNITGLLITRDGGKNESNTTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWDNMTWMEWEREIDNYTSLIYTLIEKSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSGPLVNGFLTIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL* -OQ092464,tat_exon2,8371,8467,forward,3.5,RPTSQPRGDPTGQKESKKKVERETETDPDH,RPTSQPRGDPTGQKESKKKVERETETDPDH** -OQ092464,rev_exon2,8372,8648,forward,0.3846153846153846,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILNNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGTPQILVESPAVLESGTKE,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILNNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGTPQILVESPAVLESGTKE* -OQ092464,nef,8791,9412,forward,0.3542857142857141,MGGKWSKSSVVGWPAIRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEDEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIHSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC,MGGKWSKSSVVGWPAIRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEDEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIHSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC* -OQ092467,gag,808,2308,forward,0.24380000000000002,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ* -OQ092467,pol,2100,5112,forward,0.14356929212362912,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -OQ092467,vif,5056,5644,forward,0.43229166666666674,MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH*SF* -OQ092467,vpr,5574,5868,forward,0.4807692307692313,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*T -OQ092467,tat_exon1,5845,6064,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ* -OQ092467,rev_exon1,5984,6065,forward,0.6346153846153846,MAGRSGDSDEDLLKTVRLIKQLYQSSK,MAGRSGDSDEDLLKTVRLIKQLYQSSK -OQ092467,vpu,6076,6340,forward,0.5439024390243903,MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL,MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL* -OQ092467,env,6239,8807,forward,0.49988317757009404,MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL,MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL* -OQ092467,tat_exon2,8388,8484,forward,0.886666666666666,RPASQLRGDQTGPKEQKKKVERETETDPGN,RPASQLRGDQTGPKEQKKKVERETETDPGN** -OQ092467,rev_exon2,8389,8674,forward,0.38351648351648326,DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC,DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC* -OQ092467,nef,8808,9417,forward,0.6048780487804808,MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC,MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC* +seqid,name,start,end,subtype_start,subtype_end,orientation,distance,protein,aminoacids,nucleotides +KX505501.1,env,0,1824,6224,8795,forward,1.9898364485981306,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,gag,336,1824,789,2292,forward,0.3622000000000025,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,vif,1306,1927,5040,5619,forward,2.1463541666666663,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,ATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA +KX505501.1,nef,1306,1927,8796,9417,forward,2.1430894308943085,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,ATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA +KX505501.1,pol,1628,1748,2084,5096,forward,2.1349950149551358,FCRENLAFPQGKAGEFPSEQTRANSPTSRELQVWGRDTN,FCRENLAFPQGKAGEFPSEQTRANSPTSRELQVWGRDTN*,TTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAG +KX505501.1,tat_exon2,1746,1824,8376,8469,forward,2.12,RCIRSTTRTADTELFTRDFPLGTFQ,RCIRSTTRTADTELFTRDFPLGTFQ*,AGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,vpu,1747,1927,6061,6310,forward,2.098780487804878,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA +KX505501.1,rev_exon2,1747,1927,8377,8653,forward,1.9802197802197803,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA +KX505501.1,vpr,1748,1751,5558,5850,forward,2.1884615384615382,M,M,ATG +KX505501.1,tat_exon1,1748,1751,5830,6045,forward,2.1875,M,M,ATG +KX505501.1,rev_exon1,1748,1751,5969,6045,forward,2.1653846153846152,M,M,ATG +MN691959,gag,639,2142,789,2292,forward,0.05400000000000005,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATCGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGAGAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGACACAGCAACCAGATCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAGTGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCYWYCTWTCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAAGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCWGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGAGTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MN691959,pol,1934,4946,2084,5096,forward,0.03589232303090717,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAGCTGAGACAACATCTGTTGAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAGAGCATTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGTATAGTAATATGGGGAAAGACTCCTAGATTTAAACTACCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCTTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGGTATGTTACTAACAAAGGAAGACAAAAGGTTGTCCCCCTAACTAACACAACAAATCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATCAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAATACTATTTTTAGATGGAATAGATAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATATTTTCTTTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN691959,vif,4890,5469,5040,5619,forward,0.0625,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAGGGGATGGTTTTATAGACATCACTATGAAAGAACTCATCCAAGAATAAGTTCAGAAGTATACATCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTACTTTGACTGTTTTTCAGACTCTGCTATAAGAAAGGCCTTATTAGGACATATAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAG +MN691959,vpr,5408,5702,5558,5850,forward,0.21153846153845945,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*T,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCAACAGAAGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MN691959,tat_exon1,5679,5895,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAG +MN691959,rev_exon1,5818,5896,5969,6045,forward,0.5769230769230769,MAGRSGDSDEDLLKTVRLIKFLYQSS,MAGRSGDSDEDLLKTVRLIKFLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGT +MN691959,vpu,5910,6156,6061,6310,forward,0.7060975609756097,SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL,MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL*,ATGCAACCTATACAAATAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGATCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG +MN691959,env,6070,8683,6224,8795,forward,0.0867990654205606,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*DGWQVVKK*,ATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATGCAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGGGGAATGCTACTAATACCAATAGTAGTAATACCAATAGTAGTAGCGGGGAAATGATGATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAAATAAGGTGCAGAAAGAATATGCATTCTTTTATAAACTTGATATAGTACCAATAGATAATGATACTACCAGCTATACGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGATGTAGTAATTAGATCTGCCAATTTCACAGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGCCACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACACTCCCATGCAGAATAAAACAATTTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGCGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAACAACAATGGGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATAACATGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTATAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAAGATGGGTGGCAAGTGGTCAAAAAGTAG +MN691959,tat_exon2,8237,8333,8376,8469,forward,0.19999999999999996,RPTSQTRGDPTGPKE,RPTSQTRGDPTGPKE*KKKVERETETDPFD**,AGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGA +MN691959,rev_exon2,8238,8514,8377,8653,forward,0.16483516483516492,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE*,GACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAG +MN691959,nef,8657,9278,8796,9417,forward,0.16991869918698432,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA +MN692074,env,2,4115,6224,8795,forward,1.9582943925233647,MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,gag,789,2292,789,2292,forward,0.13880000000000003,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MN692074,pol,2084,4115,2084,5096,forward,0.7912263210369039,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,vif,3617,4115,5040,5619,forward,1.9968750000000002,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,vpr,3617,4085,5558,5850,forward,1.9602564102564104,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDT,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDT,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACC +MN692074,nef,3617,4115,8796,9417,forward,1.965040650406504,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,tat_exon1,3823,4084,5830,6045,forward,2.0305555555555554,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC +MN692074,rev_exon1,3823,4084,5969,6045,forward,2.0153846153846153,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC +MN692074,vpu,4080,4164,6061,6310,forward,2.09390243902439,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA +MN692074,tat_exon2,4080,4164,8376,8469,forward,2.1133333333333333,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA +MN692074,rev_exon2,4080,4164,8377,8653,forward,2.065934065934066,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA +MN692145,gag,775,2287,789,2292,forward,0.15900000000000003,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*R*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGAACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGGACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGATAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACACAGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAATGGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAAAACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAG +MN692145,pol,2070,5085,2084,5096,forward,0.10618145563310066,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGGACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATACCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATCAAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACTGGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN692145,vif,5029,5608,5040,5619,forward,0.21875,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTATGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGACCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCATATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCCTAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAG +MN692145,vpr,5547,5841,5558,5850,forward,0.44358974358974423,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*T,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAGACT +MN692145,tat_exon1,5818,6037,5830,6045,forward,0.29166666666666674,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA +MN692145,rev_exon1,5957,6038,5969,6045,forward,0.5192307692307692,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN692145,vpu,6049,6298,6061,6310,forward,0.5804878048780489,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*,ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG +MN692145,env,6212,8783,6224,8795,forward,0.4975467289719626,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA +MN692145,tat_exon2,8364,8460,8376,8469,forward,0.4866666666666659,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +MN692145,rev_exon2,8365,8641,8377,8653,forward,0.2637362637362637,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG +MN692145,nef,8784,9576,8796,9417,forward,0.3878048780487735,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*HRAFYKGLSAGDFPGEAWPGRGRGVASPQMLHISSCFCLYWVSLVRPDLSLGALWLTREPTA*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAA +MN090335,gag,315,1665,789,2292,forward,0.8911999999999998,MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ,MYTIEGGYCII**SKFF*SCLKGWL*LFQYLFTAS*CF*QARINCESF*FPACPYYMF*SIFFLSPWP*PNFLPSI*FSPAQY*RSRTHLSPSSLR*SKMAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ*,ATGTACACAATAGAGGGTGGCTACTGTATTATATAATGATCTAAGTTCTTCTGATCCTGTCTGAAGGGATGGTTGTAGCTGTTCCAATATCTGTTTACAGCCTCCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGTTCCCTGCTTGCCCATACTATATGTTTTAATCTATATTTTTTCTTTCCCCCTGGCCTTAACCGAATTTTCTCCCATCTATCTAATTCTCCCCCGCTCAATACTGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGTCAAAAATGGCGTACTCACCAGTCGCCGCCCCTCGCCTCTTGCCGTGCGCGCTTCAGCAAGCCACCCCACAAGATTTGAACACTATGCTAAACACAGTGGGTGGACACCAAGCAGCTATGCAAATGTTAAAAGAGGTCATCAATGAGGAAGCTGCAGAATGGGATAGATTACATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATTCTGGGACTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAGCAAGGGCCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTTTAAGAGCCGAGCAAGCTACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAATCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGCAACAGGTACAGCCAACATACTGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGCCTGTTAAATGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAGGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAA +MN090335,pol,1427,4469,2084,5096,forward,0.2169491525423728,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAGGACATAGATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAATATGAACAGGTACCCATAGAAATTAGCGGACACAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGCACTCTAAATTTTCCCATCAGCCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGACGGCCCAAAGGTTAAACAATGGCCATTAACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTGTTTGCCATAAAGAAAAAAGATGGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGAATTCTGGGAAATTCAATTAGGTATACCACATCCTGCAGGGCTAAAAAAGAAAAAATCAGTCACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTATAATGTGCTTCCACAAGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAGATCCTGGAGCCTTTTAGAAAGACAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAACATAGAACAAAAGTAGAGGAACTGAGGCAACATCTGATGAGGTGGGGATTTACCACACCAGACAAAAAGCACCAGAAAGAACCCCCATTCCTTTGGATGGGGTATGAACTCCATCCTAATAAATGGACAGTACAGCCTATAGTACTGCCAGAAAAGGAAAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTGAAGCAATTATGTAAGCTCCTTAGGGGAACCAAAGCATTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGATCCGGTACATGGAGCATATTATGACCCAGCAAAGGACTTAATAGCAGAACTACAGAAGCAGGGAGAAGGTCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCATACTAATGATGTAAAGCAATTAACAGAGGCAGTGCAAAAAATATCCACAGAAAGTATAGTAATATGGGGAAGGACTCCTAAATTTAGATTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGATTATTGGCAAGCCACCTGGATCCCTGAGTGGGAGTTTGTCAACACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAATAGGGATAATAAATCAGGAAAAGCAGGATATGTTACTGATAGAGGAAGACAAAAGGTTGTCACCATAAATGACACAACAAATCAGAAAACTGAATTACAAGCCATTCATCTAGCCTTGCAGGATTCGGGGCTAGAAGTAAACATAGTAACAGACTCACAGTATGCATTAGGGATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTAATAAAAAAGGAAAAGGTCTACCTGGCATGGGTGCCAGCCCACAAAGGAATTGGAGGAAATGAACAGGTAGATAAACTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGAAAAAGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAACAATGGCTAGTGATTTTAACCTACCACCTATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGGCAAGTAGACTGTAGTCCAGGTATATGGCAGCTAGATTGTACACATTTAGAAGAAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTGATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTATTTTAAAACTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCCGCAATTTCACCAGTAATACAGTGAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGTATTCCCTACAATCCCCAGAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGATACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCCAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN090335,vif,4413,5001,5040,5619,forward,0.34375,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH*SF*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAAAAATGGGCTTATAGACACCATTACGAAACCACTCATCCAAGAATAAGTTCAGAAGTACATATCCCACTAGGGGATGATAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAGAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAACAGCAGTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAG +MN090335,vpr,4931,5225,5558,5850,forward,0.5192307692307698,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*T,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAGACCTAGGACAATATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATGGAGCCAGTAGATCATAGACT +MN090335,tat_exon1,5202,5418,5830,6045,forward,0.45833333333333326,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAG +MN090335,rev_exon1,5341,5419,5969,6045,forward,0.6923076923076923,MAGRSGDRDEDLLKTVRLIKFLYQSS,MAGRSGDRDEDLLKTVRLIKFLYQSS,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGT +MN090335,vpu,5433,5682,6061,6310,forward,0.6560975609756099,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL*,ATGCAATCTTTAGAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTAGGCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAAAATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG +MN090335,env,5596,8158,6224,8795,forward,0.6022196261682247,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*,ATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTGGACCAGATGCATGAGGATATAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAGAAATGATACTGTAGGAAATCAAACAAATCTCACTGAAACTAATACAATACAGGGAAGAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAACATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAGGGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTGGTTTTGCAATTCTAAAGTGTAAGGATGAGATGTTCAATGGAACAGGACCATGTAAGAATGTCAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTGTCAACTCAACTACTGTTAAATGGTAGCCTAGCAGAAAAAGAGATAGTACTTAGATCTGAAAATTTCACAGACAATGGTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAGGGAGAGCAATTTATGCAACAGGGCAGATAATAGGAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGGAATGACACTTTAAGCAAAATAGTTGAAAAATTAAGGGAAAAATTTGGAAAAGATAAAACAATAATCTTTAATCAATCATCAGGAGGGGACATGGAAATTGAAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGGAGTGTTAATGGAACTAGCATAAACGGAACTAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATAAACAGGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCTATCAGTGGGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATGGTGGTACAAATAATAGTACAGAGGAGACGGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAAGGCACAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAGCGTTAGGAGCTATGTTCCTCGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCACTGACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGCAATAAATCTTACGATACCATCTGGGATAACATGACCTGGATGCAGTGGGACAGAGAAATTCAAAATTACACAGGGAAAATATACAACTTACTTGAGGAATCGCAAATCCAACAGGAAAAGAATGAAAAGGAATTATTAGAACTAGATCAATGGGCAAATTTGTGGAATTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAGGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAGGGAACAGATAGGGTTATAGAGGTAGGACAAAGAATTGGCAGAGCTTTTCTCCACATACCTAGAAGGATAAGACAGGGATTAGAAAGGGCTTTGCAATAA +MN090335,tat_exon2,7739,7835,8376,8469,forward,0.3999999999999999,RPSSQPRGDQTGPKE,RPSSQPRGDQTGPKE*KKKVERETEADPED**,AGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGA +MN090335,rev_exon2,7740,8016,8377,8653,forward,0.46153846153846145,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE*,GACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAG +MN090335,nef,8159,8819,8796,9417,forward,0.5260162601625942,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*H*,ATGGGTGGCAAGTGGTCAAAAGGTTGTATGGCTGGATGGCCTACTGTAAGGGAAAGAATGGAAAGAATTGATCCAAGGCCTGCTGCAAGGAGGGAACAAGCTGAGCCAGCAGCAGCTGGGGTAGGAGCAGCATCTCGAGACTTGGAAAAATATGGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAAGTAGGCTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTGGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGACACTGA +MN090376,gag,376,1639,789,2292,forward,2.1734000000000018,MQTQIVRPF,MFCTIG*FWLTWLLFPGSAAACCVFFLLLFCSSSILSKASLVSFISIL*CTQ*RTATVLNNDLSSSDPV*SAGCSCPSICLQPSDVSNRPGLTANRSSSLLAHTICFNLYLFFPPGLNRIFSHLSNSPPLNTDALAPISLLLASASQKGVLTVRRPSPLAVRASASRVR*FWD*IK**ECIVLPAFWT*DKDQRNPLETM*IGSIKL*EPSKLHRR*KIG*QKPCWSRMQTQIVRPF*KHWVQQLH*KK**QHAREWEDPAIRQEFWRKQ*AK*QTQLP**CRKAILGAKERWLSVSIVAKKGT*PEIAGPLGKGAVGNVERKDTK*KIVLRDRQIF*GKSGLPTRGGQGTFLKAEQNQQPHQRRASVLGRRQQLLLRSRSR*TRNYTLCLPSNHSLATTLSHSKDRGATKGSSIRYRSR*,ATGTTCTGCACTATAGGGTAATTTTGGCTGACCTGGTTGCTATTTCCTGGGTCAGCTGCTGCTTGCTGTGTCTTTTTCTTACTTTTGTTTTGTTCTTCCTCTATCTTGTCTAAAGCTTCCTTGGTGTCTTTTATCTCTATCCTTTGATGCACACAATAGAGGACTGCTACTGTATTAAATAATGATTTAAGTTCCTCTGATCCTGTCTGAAGTGCTGGTTGTAGCTGTCCCAGTATTTGTCTACAGCCTTCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCCAGTTCCCTGCTTGCCCATACTATATGTTTTAACTTATATCTTTTCTTTCCCCCTGGCCTTAACCGAATTTTCTCCCATTTGTCTAATTCTCCCCCGCTTAATACCGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGTCAAAAAGGCGTACTCACCGTTCGCCGCCCCTCGCCTCTTGCTGTGCGCGCTTCAGCAAGCCGAGTCCGATAATTCTGGGATTAAATAAAATAGTAAGAATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAACCCAGATTGTAAGACCATTTTAAAAGCATTGGGTCCAGCAGCTACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAACTCAGCTTCCGTGATGATGCAGAAAGGCAATTTTAGGAGCCAAAGAAAGATGGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCAAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAGAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGA +MN090376,pol,1382,4394,2084,5096,forward,0.18823529411764706,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAGAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTGTTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGCTTTATCAAAGTAAAACAGTATGATCAGATATCAGTAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAATATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAGGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAGTTAGTAGATTTTAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCCTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTACTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAGTAGAGGAACTGAGACAACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAACTGCCAGAGAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAGTTGAATTGGGCAAGTCAGATTTATCCAGGGATTAAAGTAAGGCAGTTATGTAAACTACTTAGAGGAGCCAAGGCGCTGACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATCCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAACTTGAAAACAGGAAAATATGCAAGAACAAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATTCAAAAAGAAACATGGGAATCATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAGACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACAAAATCAGGAAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAAGTTATCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGATAAAAGCGAATCAGAGTTAGTCAATCAAATAATAGAGCAATTAATACAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGGGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGAAAGGTACTATTTTTGGATGGAATAGATAAAGCCCAAGATGAGCATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACATACCACCTGTAGTAGCAAAAGAAATAGTAGCCTGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCCCCAACTTCACCAGTAATGCAGTTAAGGCCGCCTGTTGGTGGGCAGGGGTCAAACAAGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTCGTAGAATCTATGAATAAACAATTAAAACAAATTATAGGACAGGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAGGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTGGTAATACAAGATAATAGTGACATAAAAGTAGTACCAAGAAGAAAAGCAAAAATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN090376,vif,4338,4929,5040,5619,forward,0.41770833333333335,MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH*NF*,ATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAGCATGTGGAAAAGCTTAGTAAAATACCATATACATAATTCAGGGAAGGCTAGGGGATGGTGTTATAGACATCACTATGAAAGCAGACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGAGGAGAGGCTAGACTAGTAGTGACAACATATTGGGGACTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTATTTTAATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAATAAGGTAGGATCTCTGCAGTACTTGGCACTAATAGCATTAATACCACCAAAAAGGAAAAAGCCACCTTTGCCTAGTGTGAGGAAACTGACAGAGGATAGATGGAAAGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAG +MN090376,vpr,4859,5153,5558,5850,forward,0.44230769230769296,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*T,ATGGAAAGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCTTGGCTTCATGGCCTAGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAATTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MN090376,tat_exon1,5130,5346,5830,6045,forward,0.5833333333333333,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAGGACTGCGTGCACCAGTTGCTATTGTAAAAAGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAG +MN090376,rev_exon1,5269,5347,5969,6045,forward,0.723076923076923,MAGRSGDSDEELLRIAGTIKFLYQSS,MAGRSGDSDEELLRIAGTIKFLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAGT +MN090376,vpu,5361,5631,6061,6310,forward,0.7073170731707319,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL*,ATGCAATCTTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTCGTTTGGTCTATAGTACTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAA +MN090376,env,5524,8137,6224,8795,forward,0.5484813084112157,MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*NGRHILKT*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAATGCAGAGGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAGCCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACACAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTAACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTAACATCAATAGCACTAATATAAACAATACCAATAGTATAGAAAGAGAAATGACAAACTGCTCTTTTAATGTCACCACAGTCATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAAACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGCTATAGGTTGATAAATTGTAACTCCTCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAATTTCAATGGAACAGGACTATGTAAAAATGTTAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGAGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAACACAGAAGTAAATATTATCACACTCCCATGCAAGATAAGGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACATTTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTACATTTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGAAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAAAATGGGAGGCATATTCTCAAAACGTAA +MN090376,tat_exon2,7691,7784,8376,8469,forward,0.4866666666666659,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAG +MN090376,rev_exon2,7692,7968,8377,8653,forward,0.46153846153846145,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG +MN090376,nef,8111,8735,8796,9417,forward,0.6943089430894234,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACATCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACTCAGAGAGAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA +MK115581.1,gag,680,2186,789,2292,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115581.1,pol,1972,4984,2084,5096,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115581.1,vif,4928,5507,5040,5619,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115581.1,vpr,5446,5740,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115581.1,tat_exon1,5717,5936,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115581.1,rev_exon1,5856,5934,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115581.1,vpu,5948,6194,6061,6310,forward,0.6865853658536587,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115581.1,env,6111,8652,6224,8795,forward,0.49135514018691584,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115581.1,tat_exon2,8233,8329,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115581.1,rev_exon2,8234,8519,8377,8653,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115581.1,nef,8653,9274,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK115690.1,gag,777,2292,789,2292,forward,0.1894,MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ*R*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGACAAGTGGGAAAAAATTCGGTTGAGGCCAGGGGGAAAGAAAAAATATAGATTAAAGCATATCGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATAATGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTGTATAATACAGTAGCAACCCTCTATTGTGTACATCAAAGGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGGCGCAGGAAACAGCAGTCAGACCAGCACCAGCCAAAATTACCCTATAGTACAGAACATTCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTCTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTACATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACTAATAATCCACCTATCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCCACCAGCATTCTAGACATAAGACAAGGACCAAAGGAGCCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTAGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGTCCAGCAGCTACACTAGAGGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGTCATAAAGCAAGAGTTTTAGCGGAAGCAATGAGCCAAGCAACAAATTCAGCTGCCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAAAGTGTTAAGTGTTTTAATTGCGGCAAAGATGGGCACATAGCAAAAAATTGCAGGGCCCCTAGAAGAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTCCAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGAAGATAGACCAGGACCTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGGTAG +MK115690.1,pol,2078,5090,2084,5096,forward,0.13958125623130613,FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGAAGATAGACCAGGACCTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGGTAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGACATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAAATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGCACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATAGGGCCTGAGAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGACTTCAGAGAACTAAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCCTATTTTTCAGTTCCCTTAGACAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAACCTTATAGAAAACAAAATCCAAACATAGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACCTAGAAATAGGGCAGCATAGAATAAAAATAGAAGAACTGAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGGTATGAACTCCATCCTGACAAGTGGACAGTACAGCCTATAGCGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAACTGGGCAAGTCAGATCTACCCAGGAATTAAAGTAAGGCAATTATGTAAACTACTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAAAAGAAGCAGAGCTAGAATTAGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGAGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTGACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTGATATGGGGAAAGACTCCTAAATTTAGACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAAACTAAATCAGGAAAAGCAGGATATGTTACTAATAGAGGAAGACAAAAAGTTATCCCCCTAACTGACACAACAAATCAGAAGACTGAGTTACATGCAATTTATCTAGCTTTGCAAGATTCGGGATTAGAAGTAAATATAGTAACAGACTCACAGTATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTGTTTTTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTCATTCCAGCAGAGACAGGGCAGGAAGCAGCATACTTTATTTTAAAATTAGCAGGACGATGGCCAGTAGCAACAATACATACAGACAATGGCAGCAATTTCACCAGTGCTACAGTTAAGGCCGCCTGCTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAACAATGAATTGAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACGTAATAGCAACAGACTTACAAACTAAAGAACTACAAAAACAAATTACAAAAATTCAACATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGAAATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115690.1,vif,5034,5622,5040,5619,forward,0.40104166666666674,MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH,MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH*SF*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAAGATGGCACAGTTTAGTAAAACACCATATATATATTTCAGGGAAAGCTAGAGGATGGGTTTATAAACATCACTATGAAAACACTCATCCAAGAATAAGTTCAAAAGTATACATCCCACTAGGGGAAGCTAGACTGGCAGTAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCACTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAAGGAATATAGCACACAAGTAGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGTCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTTTACAGTACTTGGCACTAACAGCATTAGTAACACCAAAAAAGACAAAGCCACCTTTGCCTAGTATTACGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAGAACCAAGGGCCACCGAGGGAACCATACAATGAATGGGCACTAGAGCTTTTAG +MK115690.1,vpr,5552,5846,5558,5850,forward,0.5576923076923082,MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS,MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS*S,ATGGAACAAGCCCCAGAGAACCAAGGGCCACCGAGGGAACCATACAATGAATGGGCACTAGAGCTTTTAGAGGAGCTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACACATCTATGAGACTTATGGGGATACTTGGACAGGAGTGGAAGCCTTAATAAGAAGTCTGCAACAACTGCTGTTCATTCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGAATTACTCCACAGAGGAGAACAAGAAATGGAGCCAGTAGATCCTAATCT +MK115690.1,tat_exon1,5823,6039,5830,6045,forward,0.45833333333333326,MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ,MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ,ATGGAGCCAGTAGATCCTAATCTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCACTTGCTATTGTAAACAGTGTTGCTATCATTGCCAAGTTTGTTTCATAACCAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAG +MK115690.1,rev_exon1,5962,6040,5969,6045,forward,0.6923076923076923,MAGRSGDNDEDLLKTVRFIKLLYQSS,MAGRSGDNDEDLLKTVRFIKLLYQSS,ATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAGT +MK115690.1,vpu,6054,6300,6061,6310,forward,0.552439024390244,MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL,MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL*,ATGCAATCTTTAGCAATATTAGCAATAGTAGCATTAGTAGTAGCAGCCATAATAGCAATAGTTGTGTGGACCATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGATAGTGGCAATGAGAGTGAAGGGGATCATGAAGAATTATCAGCACTTATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAG +MK115690.1,env,6217,8800,6224,8795,forward,0.5558411214953274,MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ,MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ*,ATGAGAGTGAAGGGGATCATGAAGAATTATCAGCACTTATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTTACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAAACACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCTACAGACCCCAACCCACAAGAAATAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTACATTGCACTAAGTTGGAGATTAATAGCACTAAGAAGACTAATAGCACTAATAATGGTACTAACATCAATGCCACTGATGATAGTTGGGGGGAAATGAAAAACTGCTCTTTCAATACCACTGCAAGCATAAGAGATAAGGTACAGAGAGAATTTGCGCTTTTTTATAAACTTGATATAGTACCAATAGATAATGATGATATCAACTATAGGTTAATAAGTTGTAACACCTCAGTCCTTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAGAGATAAAAATTTCAATGGAACAGGACAATGTAAAAATGTCAGCACAGTGCAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTCAATGGCAGTCTAGCAGAAGAAGAGGTAGTAATTAAATCTGAAAATATCACAGACAATACTAAAACTATAATAGTACAGCTGAATGCATCTGTAGCAATTGTTTGTACAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGGCCAGGGAGAGCGTTTTATGCAGCAGGAGATATAATAGGAGACATAAGACGAGCACACTGTATCCTTAACAAAACAACATGGGATAACACAATAGAACAGGTAGCTAAAAAATTAAGAGAACAATTTGAGAATAAGACAATAGTCTTTAGTGAATCCTCGGGAGGGGACCCAGAAATTACAATGATTAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAGTACAACTGTTTAATAGTACTTGGCATAATAATGGGAGTAGTACTACAGGGTCAAGTAGCAGTGAAGGCAATATCACACTCCCATGCAAAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACCAATTAGCTGCGAGTCAAATATTACAGGGTTGCTACTAACAAGAGATGGTGGGAATGACGCTAACGGGAACAACACCGAGACCTTCAGACCTGGAGGAGGAAATATGAGGGACAATTGGCGAAGTGAATTATATAGATACAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAGGGCACAGAGAAGAGTGGTACAGAGAGAAAAAAGAGCAGTGGGTCTCGGAGCCTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGCTTTGGGGTTGCTCTGGAAAACTCATCTGCAACACTGCTGTGCCTTGGAATACTAGTTGGAGTAACAAATCTCTGGATGATATTTGGCATAACATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAAACATAATATACAGCTTAATTGAGGCATCGCAAACCCAGCAAGAAAAGAATGAACAAGAATTACTAGAATTAGACAAATGGGCAAGTCTGTGGAATTGGTTTAGCATATCAAACTGGCTGTGGTACATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTACTATACTTTCTATAGTGAATAGAGTTAGGAAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAGTGGATGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAACCTGTGCCTCTTCCTCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATACTGGTGGAACCTTCTGCAGTATTGGAGGCGGGAACTAAAGAATAGTGCTGTTAGCTTGCTTAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGAGTTATAGAAGGATTGCGCAGAGCTTTTAGAGCTATTATCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGAGCTTTGCAATAA +MK115690.1,tat_exon2,8381,8489,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKEPETKVESKTETDPLT,RPTSQPRGDPTGPKEPETKVESKTETDPLT*WMDS*,AGACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAGTGGATGGATTCTTAG +MK115690.1,rev_exon2,8382,8658,8377,8653,forward,0.4505494505494505,DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE,DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE*,GACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAGTGGATGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAACCTGTGCCTCTTCCTCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATACTGGTGGAACCTTCTGCAGTATTGGAGGCGGGAACTAAAGAATAG +MK115690.1,nef,8801,9425,8796,9417,forward,0.6089430894308867,MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN,MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN*NC*,ATGGGTGGTAAATGGTCAAAATGTAGTATAGTTGGATGGCCTACTGTAAGGGAAAGAATAAGACGAGCAGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAAGCATGGAGCAATCACAAGTAGCAATGCTAACAATGCTGATTGTACCTGGCTGGAAGCCCAAAAAGAAGAGGAGGAGGTAGGCTTTCCAGTCAGGCCTCAGGTACCCTTAAGACCAATGACTTACAAGGCAGCCTTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGATAATTTACTCCCAAAAAAGACAAGATATTCTTGATCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACTAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGAGAGGGTAGAAGAGGAGAATAAAAGAGAGAACCGCTGCTTGTTACACCCTATGAGCCAGCATGGGATGGATGACCCAGAGAAAGAAGTGCTACAGTGGAGGTTTGACAGCCGCCTAGCCTTTCACCACGTAGCCAGAGAGCTGCATCCGGAGTACTATAAGAACTAGAACTGCTGA +MK115571.1,gag,579,2079,789,2292,forward,0.2571999999999999,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115571.1,pol,1871,4883,2084,5096,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAAATAGGGGGGCAATTTAAAGAAGCTTTCTTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTAAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115571.1,vif,4827,5406,5040,5619,forward,0.36979166666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115571.1,vpr,5345,5639,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115571.1,tat_exon1,5616,5832,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG +MK115571.1,rev_exon1,5755,5833,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115571.1,vpu,5847,6093,6061,6310,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115571.1,env,6010,8551,6224,8795,forward,0.49065420560747675,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAGATAAGATGCAGAAAGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAAATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGGATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTTAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115571.1,tat_exon2,8132,8228,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115571.1,rev_exon2,8133,8418,8377,8653,forward,0.4285714285714286,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115571.1,nef,8552,9173,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAATGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGATACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTGCACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK115514.1,gag,584,2090,789,2292,forward,0.2571999999999999,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115514.1,pol,1876,4888,2084,5096,forward,0.14456630109670976,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGCTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAATACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115514.1,vif,4832,5411,5040,5619,forward,0.36979166666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGAGATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115514.1,vpr,5350,5644,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115514.1,tat_exon1,5621,5840,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115514.1,rev_exon1,5760,5838,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115514.1,vpu,5852,6098,6061,6310,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115514.1,env,6015,8556,6224,8795,forward,0.4941588785046729,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATATTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAGTCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTAAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115514.1,tat_exon2,8137,8233,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115514.1,rev_exon2,8138,8423,8377,8653,forward,0.4285714285714286,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115514.1,nef,8557,9178,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACGGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK115488.1,gag,707,2213,789,2292,forward,0.2571999999999999,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115488.1,pol,1999,5011,2084,5096,forward,0.14456630109670976,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGCTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAATACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115488.1,vif,4955,5534,5040,5619,forward,0.36979166666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGAGATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115488.1,vpr,5473,5767,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115488.1,tat_exon1,5744,5963,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115488.1,rev_exon1,5883,5961,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115488.1,vpu,5975,6221,6061,6310,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115488.1,env,6138,8679,6224,8795,forward,0.4941588785046729,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATATTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAGTCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTAAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115488.1,tat_exon2,8260,8356,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115488.1,rev_exon2,8261,8546,8377,8653,forward,0.4285714285714286,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115488.1,nef,8680,9301,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACGGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK115030.1,gag,176,1685,789,2292,forward,0.22580000000000022,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATGGGAAAAAATTTACCTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGTGTACATCAAAGGATAAATGTAAAAGACACCAAGGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATGGTACATCAACCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAGGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAGGGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATACTCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGGGATTATGTAGACCGGTTCTATAAAACTCTAAGGGCTGAGCAAGCGTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAATCAGCCTCCATAATGGTGCAGGGAGGCAATTTTAGGAACCAAAGAAAGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA +MK115030.1,pol,1477,4567,2084,5096,forward,0.21934197407776668,FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*NMEQFSKTPYAYFKESSEMGLQTSL*,TTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCAGTCAACATAATTGGAAGAAATCTGTTGACCCAGCTTGGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATGGAAAAGGAAGGGAAAATTACAAAAATTGGGCCTGAGAATCCATATAATACTCCAGTGTTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTGGGAAGTTCAACTAGGAATACCACATCCCGCAGGGTTAAAAAGGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGGAGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGGGGTGGGGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAGTTGAATTGGGCAAGCCAGATCTATCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGGGGAGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCTATACAAAAGGAAACATGGGAAATGTGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAATTAGGAAAAGCAGGGTATGTTACGGACAGAGGAAGACAAAAGGTTGTCTCCCTAATGGACACAACAAATCAGAGGACTGAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAGGGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAGGAAAAGATTTACCTGGCATGGGTCCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTAATGGAATCAGAAAAATACTATTTCTGGATGGAATAGATAAGGCCCAAGAAGAACATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGA +MK115030.1,vif,4433,5012,5040,5619,forward,0.38020833333333326,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGGGGAAGCAAGATTGGTAATAAAAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAG +MK115030.1,vpr,4951,5245,5558,5850,forward,0.5192307692307698,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*L,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGACATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGCTT +MK115030.1,tat_exon1,5222,5441,5830,6045,forward,0.5972222222222223,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA +MK115030.1,rev_exon1,5361,5439,5969,6045,forward,0.6538461538461537,MAGRSGDSDEELLTAVRIIKRLYQSS,MAGRSGDSDEELLTAVRIIKRLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT +MK115030.1,vpu,5453,5699,6061,6310,forward,0.780487804878049,MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM,MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM*,ATGCATATCTTAGAAATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGGGACCAGGAGGAATTATCAGCAATTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG +MK115030.1,env,5616,8217,6224,8795,forward,0.5768691588785053,MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGAAAGTGACGGGGACCAGGAGGAATTATCAGCAATTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAGAAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAAATCGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAGGTAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATGGAACAGACATAATAGGGGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAATAATACTTGGAATGGTACTGATAATTGGAATGGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGAAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAATGGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAACCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAAGCAGTGGGAAAAGGAAATTGACAATTACACAGACATAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTAAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +MK115030.1,tat_exon2,7798,7891,8376,8469,forward,0.4866666666666659,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG +MK115030.1,rev_exon2,7799,8075,8377,8653,forward,0.4285714285714286,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG +MK115030.1,nef,8218,8866,8796,9417,forward,0.7959349593495859,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*H*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTGCCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATACTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGACACTGA +MK115498.1,gag,663,2169,789,2292,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115498.1,pol,1955,4967,2084,5096,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115498.1,vif,4911,5490,5040,5619,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115498.1,vpr,5429,5723,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115498.1,tat_exon1,5700,5916,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG +MK115498.1,rev_exon1,5839,5917,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115498.1,vpu,5931,6177,6061,6310,forward,0.6865853658536587,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115498.1,env,6094,8635,6224,8795,forward,0.49135514018691584,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115498.1,tat_exon2,8216,8312,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115498.1,rev_exon2,8217,8502,8377,8653,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115498.1,nef,8636,9257,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK115211.1,gag,250,1753,789,2292,forward,0.1938000000000002,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP*SQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGACAAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAGATATAAGTTAAAACATATAGTATGGGCAAGCAGGGAACTGGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAGGAACTTAAATCATTATTTAATACAGTAGCAGTCCTCTATTGTGTGCATCAAAAGATAGAGATAAAAGACACCAAGGAAGCTTTAGACAAGATAGAGGAAGAACAAAACAAAAGTAAGAAAAAGACACAGCAAGCAGCAGCTGACACAGGACATAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATGCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTGAAAGTAGTAGAAGAGAAGGCATTTAGCCCAGAAGTAATACCCATGTTTTCAGCCTTATCAGAAGGAGCCACCCCACAAGATTTGAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACTATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCGATTGCACCAGGCCAGATGAGAGAGCCGAGGGGAAGTGACATAGCAGGAACCACCAGTACCCTTCAGGAGCAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTACAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAACCCAGATTGTAAAACCATTTTAAAAGCATTGGGTCCAGCAGCTACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAACTCAAATGCCGTGATGATGCAGAAAGGCAATTTTAGGAGCCAAAGAAAGATGGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCAAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAACTTTCCTCAAAGCAGGACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAA +MK115211.1,pol,1545,4557,2084,5096,forward,0.20219341974077754,FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAACTTTCCTCAAAGCAGGACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTGTTAGAAGACATGAATTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAAACAGTATGATCAGATATCAGTAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAATATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAGGAAATGGAAAAGGAAGGGAAAATTTCAAGAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCAATAAAGAAAAAAGACAGTACTAAATGGAGAAAGTTAGTAGATTTTAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCCTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTACTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCTGACATAGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAGTAGAGGAACTGAGACAACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAACTGCCAGAGAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAGTTGAATTGGGCAAGTCAGATTTATCCAGGGATTAAAGTAAGGCAGTTATGTAAACTACTTAGAGGAGCCAAGGCGCTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATCCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAACTTGAAAACAGGAAAATATGCAAGAACAAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATTCAAAAAGAAACATGGGAATCATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACAAAATCAGGAAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAAGTTATTTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGATAAAAGCGAATCAGAGTTAGTCAATCAAATAATAGAGCAATTAATACAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGGGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGAAAGGTACTATTTTTGGATGGAATAGATAAAGCCCAAGAAGATCATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACCTACCACCTGTAATAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCTAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCCCCAACTTCACCAGTAATGCAGTTAAGGCCGCCTGTTGGTGGGCAGGGGTCAAACAAGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTTGTAGAATCTATGAATAAACAATTAAAACAAATTATAGGGCAGGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAGGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTGGTAATACAAGATAATAGTGACATAAAAGTAGTACCAAGAAGAAAAGTAAAAATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAA +MK115211.1,vif,4501,5083,5040,5619,forward,0.39687499999999987,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAACATGTGGAAAAGCTTAGTAAAATACCATATACATAATTCAGGGAAGGCTAGGGGATGGTGTTATAGACATCACTATGAAAGCAGACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGAGGAGAGGCTAGACTAGTAGTGACAACATATTGGGGCCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTATTTTAATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAATAAGGTAGGATCTCTGCAGTACTTGGCACTAATAGCATTAATACCACCAAAAAGGAGAAAGCCACCTTTGCCTAGTGTGAGGAAACTGACAGAGGATAGATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG +MK115211.1,vpr,5022,5316,5558,5850,forward,0.4807692307692313,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*T,ATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCATGGCTTCACGGCCTAGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAACTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGGGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115211.1,tat_exon1,5293,5512,5830,6045,forward,0.5694444444444444,MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAAGACTGCTTGCACCAGTTGCTATTGTAAAAGGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGA +MK115211.1,rev_exon1,5432,5513,5969,6045,forward,0.7115384615384615,MAGRSGDSDEELLRITRTIKFLYQNSE,MAGRSGDSDEELLRITRTIKFLYQNSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGAG +MK115211.1,vpu,5524,5794,6061,6310,forward,0.7439024390243905,MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL,MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL*,ATGCAATCTTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTCGTTTGGTCTATAGTATTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAA +MK115211.1,env,5687,8198,6224,8795,forward,1.2061915887850478,MHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGRSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDPEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTTINNTSSIEEGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSATITQACPKVSFEPIPIH*VQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRKAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAATGCAGAAGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACCCAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTGACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTGAGTTGAAGAATAGCACTACTATAAACAATACCAGTAGTATAGAAGAAGGAGAAATGAAAAACTGTTCTTTTAATGCCACCACAGCAATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAGACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGATATAGGTTGATAAATTGTAACTCCGCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTAGGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAAAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGAAAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGAGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAATACAGAAGTAAATATTATCACACTCCCATGCAAGATAAAGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACACTTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTACATTTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGTAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGACTTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA +MK115211.1,tat_exon2,7779,7872,8376,8469,forward,0.4866666666666659,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAG +MK115211.1,rev_exon2,7780,8056,8377,8653,forward,0.46153846153846145,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG +MK115211.1,nef,8199,8838,8796,9417,forward,0.6943089430894234,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC*QRAF*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACACCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTGCCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACCCAGATAAAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGACAGCGAGCTTTCTAA +MK115158.1,gag,316,1819,234,1731,forward,0.3517171717171721,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP*SQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGACAAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAACAATATAAGTTAAAACATATAGTATGGGCAAGCAGGGAACTGGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAGGAACTTAAATCATTATTTAATACAGTAGCAGTCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGACAAGATAGAGGAAGAACAAAACAAAAGTAAGAAAAAGACACAGCAAGCAGCAGCTGACCCAGGAAATAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATGCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTGAAAGTAGTAGAAGAGAAGGCTTTTAGCCCAGAAGTAATACCCATGTTTTCAGCCTTATCAGAAGGAGCCACCCCACAAGATTTGAACACGATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACTATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCGATTGCACCAGGCCAGATGAGAGAACCGAGGGGAAGTGACATAGCAGGAACCACCAGTACCCTTCAGGAGCAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTACAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAACCCAGATTGTAAGACCATTTTAAAAGCATTAGGTCCAGCAGCTACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAACTCAGCTTCCGTGATGATGCAGAAAGGCAATTTTAGGAGCCAAAGAAAGATGGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCAAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTATGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAA +MK115158.1,pol,1611,4623,1526,4535,forward,0.26447105788423153,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTATGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTGTTAGAAGAAATGAGTCTACCAGGAAGATGGAAGCCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAAACAGTATGATCAGATATCAGTAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAATATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAGGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCAATAAAGAAAAAAGACAGTACTAAATGGAGAAAGTTAGTAGATTTTAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCCTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTACTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAGAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATGGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAGTAGAGGAACTGAGACAACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAACTGCCAGAGAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAGTTGAATTGGGCAAGTCAGATTTATCCAGGGATTAAAGTAAGGCAGTTATGTAAACTACTTAGAGGAGCCAAGGCGCTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATCCTAAAAGAACCAGTGCATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAACTTGAAAACAGGAAAATATGCAAGAACAAGGGGTGCTCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATTCAAAAAGAAACATGGGAATCATGGTGGACAGAATATTGGCAAGCCACTTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACAAAATCAGGAAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAAGTTATCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGATAAAAGCGAATCAGAGTTAGTCAATCAAATAATAGAGCAATTAATACAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGGGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGAAAGGTACTATTTTTGGATGGAATAGATAAGGCCCAAGAAGATCATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACATACCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCTAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCCCCAACTTCACCAGTAATGCAGTTAAGGCCGCCTGTTGGTGGGCAGGGGTCAAACAAGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTTGTAGAATCTATGAATAAACAATTAAAACAAATTATAGGACAGGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAACTTCTTTGGAAAGGTGAGGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTACCAAGAAGAAAAGCAAAAATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAA +MK115158.1,vif,4567,5149,4479,5061,forward,0.5668393782383419,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAACATGTGGAAAAGTTTAGTAAAATACCATATACATAATTCAGGGAAGGCTAGGGGATGGTGTTATAGACATCACTATGAAAGCAGACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGAGGAGAGGCTAGACTAGTAGTGACAACATATTGGGGCCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTATTTTAATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAATAAGGTAGGATCTCTGCAGTACTTGGCACTAATAGCATTAATACCACCAAAAAGGAGAAAGCCACCTTTGCCTAGTGTGAGGAAACGGACAGAGGATAGATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG +MK115158.1,vpr,5088,5379,5000,5291,forward,0.46875,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*,ATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCATGGCTTCACGGCCTGGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAATTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115158.1,tat_exon1,5359,5578,5271,5486,forward,0.5416666666666667,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAGGACTGCGTGCACCAGTTGCTATTGTAAAAAGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAAGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGA +MK115158.1,rev_exon1,5498,5579,5410,5486,forward,0.75,MAGRSGDSDEELLKITRTIKFLYQNSE,MAGRSGDSDEELLKITRTIKFLYQNSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAAGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGAG +MK115158.1,vpu,5590,5860,5502,5748,forward,0.5308641975308646,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWDVNDL,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWDVNDL*,ATGCAATCCTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTTGTTTGGTCTATAGTACTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAA +MK115158.1,env,5753,8342,5665,8212,forward,0.5740566037735857,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGMSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCENVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGMSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCENVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*NGRHILKT*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAATGCAGAAGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACACAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTGACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTGAGTTGAAGAATAGCACTGGAGAAATGAAAAACTGTTCTTTTAATGCCACCACAGCAATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAGACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGATATAGGTTGATAAATTGTAACTCCTCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAATTTCAATGGAACAGGACTATGTGAAAATGTTAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAAAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGGGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAATACAGAAGTAAATATTATCACACTCCCATGCAAGATAAAGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTATATCTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGAAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGACTTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGAGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAAAATGGGAGGCATATTCTCAAAACGTAA +MK115158.1,tat_exon2,7896,7992,7793,7886,forward,0.6935483870967742,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*R,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGC +MK115158.1,rev_exon2,7897,8173,7794,8070,forward,0.5274725274725274,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGSGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGSGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGAGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG +MK115158.1,nef,8316,8994,8213,8834,forward,0.6674757281553398,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC*QRAFYKGLSARDFPGEA*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACACCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTGCCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACTCAGAGAGAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGACAGCGAGCTTTCTACAAGGGACTTTCCGCTAGGGACTTTCCAGGGGAGGCGTGA +MK114705.1,gag,532,2053,789,2292,forward,0.21479999999999988,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ*R*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGCGAATTAGATAGATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAGTTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCGGTTAATCCTGGCCTGTTAGAAACATCAGAGGGCTGTAGGCAAATACTGGGACAGCTACAACCGTCCCTTCAAACAGGATCAGAAGAACTTAAATCATTATTTAATACAATAGCAGTCCTTTATTGCGTACATCAAAGGATAGATGTAAAAGACACCAAGGAAGCTCTAAATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAGCAGTCAGAGCAGTCAAGTCAGCCAAAATTACCCTATAGTGCAGAACCATCAGGGGCAAATGGTATATCAGGCTCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCCGAGGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAGGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTACATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGGACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGAAATTTATAAAAGATGGATAATCATGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTATCAGCATTCTGGACATAAGACAAGGACCAAAAGAACCTTTTAGAGATTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAAGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACCATTCTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCAGCCACAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGCAACAGGTGGTGCAACTAACATAATGATGCAGAAAGGCAATTTTAGGAACCAAGGAAAACCTATTAAGTGTTTCAATTGTGGCAAAGAAGGGCACCTAGCTAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGACTGCTCTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTCCAGAACAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAGCTCCCCCTCAGAAGCAGGAGCCGACAGACAAGGAACTGTATCCCTTCTCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAGTAAAGATAG +MK114705.1,pol,1839,4851,2084,5096,forward,0.17248255234297116,FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTCCAGAACAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAGCTCCCCCTCAGAAGCAGGAGCCGACAGACAAGGAACTGTATCCCTTCTCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAGTAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAAATACCCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTAAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAACCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCCGTATTTGCCATAAAGAAAAAGGATAGTACTAAATGGAGAAAGTTAGTAGATTTCAGAGAGCTTAATAAAAGAACTCAAGACTTTTGGGAGGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTCTCAGTTCCTTTAGATGAAAGCTTCAGAAAGTATACTGCATTTACCATACCTAGTACTAACAATGAGACACCCGGGATTAGGTATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTTCAAAGTAGCATGACGAAAATCTTAGAACCTTTTAGAAAACAAAATCCAGACATAGTTATCTACCAATACATGGATGATTTATACGTAGGATCTGACTTAGAAATAGAGCAGCATAGAGCAAAAGTAGAGAACCTGAGAGAGCATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAGCATCAGAAAGAACCTCCATTTCTTTGGATGGGCTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAGCTAAGGCACTAACAGAAGTGATAACACTAACAGAAGAAGCAGAGCTAGAATTGGCAGAAAACAGAGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAGTAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACCTATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAACAAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAAGCAGTTCAAAAAATAGCCACAGAGAGCATAGTAGTATGGGGAAAGATTCCTAAATTTAGATTACCCATACAGAAAGAAACATGGGAAACATGGTGGATGGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAGTACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAAAAAGGAAAAGCAGGATATGTTACTGACAGAGGAAGGCAAAAAGTTATCCCCTTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGACAAGAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAGAAGGTCTACCTGACATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCAGGAATCAGGAAAATACTATTTTTGGATGGAATAGATAAGGCCCAGGAAGATCATGAGAAATATCATAGTAATTGGAAAGCAATGGCTAGTGATTTTAACATACCACCTGTGGTAGCAAAAGAGATAATAGCCAGCTGTGATAAATGTCAGCTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTCCATGTAGCCAGTGGGTACATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAAAATAATACATACAGATAATGGTAGCAATTTCACCAGCACTACAGTCAAGGCCGCCTGCTGGTGGGCAGGTGTTAAGCAGGAGTTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTGGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGAGTACTGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAGGGACCAGCAAAGCTGCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGAAATCAAAGTAGTACCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK114705.1,vif,4795,5383,5040,5619,forward,0.34375,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH*NF*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTCTAGTAAAACACCATATGTATATTTCAAAGAAAGCTAAGGGATGGGTTTACAGACACCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGGAAAAAGAGATATAACACACAAGTAGACCCTGGCCTAGCAGACCAACTAATTCATATGTACTATTTTGATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTGCAATACCTGGCACTAGCAGTATTAGTAGCACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTCGCGAGACTGACAGAGGATAGATGGAACAAGCCCCGGAAGATCAAGGGCCACAGAGAGAGCCATACAATGAATGGGCACTAGAACTTTTAG +MK114705.1,vpr,5313,5601,5558,5850,forward,0.46153846153846234,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS*T,ATGGAACAAGCCCCGGAAGATCAAGGGCCACAGAGAGAGCCATACAATGAATGGGCACTAGAACTTTTAGAGGAGCTTAAGAGGGAAGCTGTTAGACATTTTCCTAGGGAATGGCTCCATAGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGGCAGGAGTAGGAGCCATAATAAGAATACTGCAACAATTACTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGGATAGGCATACTGAGGAGAACAAGAAATGGAGCCCGTAGATCCTAGACT +MK114705.1,tat_exon1,5578,5797,5830,6045,forward,0.6222222222222225,MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ,MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ*,ATGGAGCCCGTAGATCCTAGACTGGAACCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTAACAATTGCTATTGTAAAAAGTGCTGCTTTCATTGCCAAGTTTGCTTCACAAAAAAGGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGCGACAGAGACGAGGACCTCCTCGAGACAGTCAGATTCATCAAGTTCCTCTACCAAAACAGTAA +MK114705.1,rev_exon1,5717,5798,5969,6045,forward,0.8653846153846154,MAGRSGDRDEDLLETVRFIKFLYQNSK,MAGRSGDRDEDLLETVRFIKFLYQNSK,ATGGCAGGAAGAAGCGGCGACAGAGACGAGGACCTCCTCGAGACAGTCAGATTCATCAAGTTCCTCTACCAAAACAGTAAG +MK114705.1,vpu,5809,6055,6061,6310,forward,0.7963414634146342,MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL,MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL*,ATGCAACCTTTAGAGATATCAGCAATAGTAGCATTAGTAGTAGTAGCAATAATAGCAATAGTTGTGTGGACCATAGTACTCTTAGAGTATAGGAAAATATTAAGGCAAAAGAAAATAGACAGATTAATTAATAGAATAAGTGAAAGAGCAGAAGACAGTGGCAATGAGAGTGACGGGGATCAAGAAGAATTGTCAGCTCTTATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAG +MK114705.1,env,5972,8549,6224,8795,forward,0.5660046728971964,MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL,MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL*,ATGAGAGTGACGGGGATCAAGAAGAATTGTCAGCTCTTATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAGTGCTACAAACATGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGATGCAACCACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGATACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCGACCCACAAGAAGTAGTACTGGAAAATGTGACAGAAAATTATAATATGGGAAAAAATAACATGGTGGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTACTCTTAACCCCATTCTGTGTCACTTTAAATTGCACTGATGCTAACATCACCAGCACTAATAATAGTAGAGATAAGAAGGAAGGAGAAAGTACATTGGAGGAGACGAAAGGAGAAATAAAAAACTGCTCTTTCAATATGACTTCAAGCATGAGCGATAAGTCTCAGAAACAACGTGCACTTTTTTATAAGCTTGATGTGGTACAAATAGATGAGACTAATAATAATAGTTATAGGTTGATAAGTTGTAACACCTCAGTCGTCACACAGGCTTGTCCAAAGGTATCCTTTGATCCAATCCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATAATAAGAAATTCAATGGAACAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAACCTGTAGTGTCAACCCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAAGTAATGATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTGCAGCTGAAGACACCTGTACAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGGATAAGTATGGGACCAGGGAGAGTAATTTATGCAACAGGACAAATAATAGGAGATATAAGAAAAGCACATTGCAACATTAGTAGAGCAGAATGGAATACAACTTTAAAGCAGATAGTTACACAATTAAGAAAGCAGTGGAATAGAACCATAATCTTTAACTCATCCTCAGGAGGGGACCCAGAAATTGTGATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACAAAACTATTTAATAGTACTTGGCCACGTAATAGTACTTGGAATAATACTGAAGGGTCAAATGACACTGAAATAATCACACTCCCGTGCAGAATAAAACAAATTGTAAACAGGTGGCAGGAAGTAGGCAAAGCAATGTATGCCCCTCCCATCCAAGGACAAATTAGTTGTTCATCAAATATTACAGGGCTGCTACTAGTTAGAGATGGTGGAATTAACACCAGTGAGAGCAACGAGACCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAGGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATGCTGGGAGCTATGTTCCTTGGGCTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGTTGACGGTACAGACCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAGCAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGACTCCTAGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAACACTAGTTGGAGTAATAGATCTTATGAAGATATTTGGAACAACATGACCTGGATGGAGTGGGAAAAAGAAATTGACAATTACACAGGCTTAATATACACCTTAATTGAAAAATCGCAGAACCAGCAGGAAATAAATGAACAAGAACTATTGTCATTGGATAAGTGGGCAAGCCTGTGGAATTGGTTTAATATAACAAATTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGACTGGATTCTTCGCACTTTTCTGGGACGATCTACGAAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTAATCTTGATTGTAGTGAGGGTTGTGGAAATTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAAATAAAGAATAGTGCTATCAGCTTGCTCAACGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGAATCATAGGAGTAGTACAAAGAACTTGGAGAGCTTTTATCCACATACCTAGGAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA +MK114705.1,tat_exon2,8130,8226,8376,8469,forward,0.9733333333333327,RPPAQPQGDPTGPKKSKKEVEKETETDQCD,RPPAQPQGDPTGPKKSKKEVEKETETDQCD**,AGACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGA +MK114705.1,rev_exon2,8131,8407,8377,8653,forward,0.5494505494505495,DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE,DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE*,GACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGACTGGATTCTTCGCACTTTTCTGGGACGATCTACGAAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTAATCTTGATTGTAGTGAGGGTTGTGGAAATTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAAATAAAGAATAG +MK114705.1,nef,8550,9138,8796,9417,forward,0.4593495934959331,MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK,MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK*CVPVCCVTLVTRDPSDHFSQRGKSLAVAPEQGPESESRTRGDLSTQDSAC*,ATGGGTGGAAAATGGTCAAAAAAGAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAAAATGAAGCGAACTGAGCCAGCAGCAGAGGGGGTGGGAGCAGCATCTCGAGACCTGGACAAATATGGAGCAATCACAAGTAGCAATACAGCACAGACCAATCCTGATTGTGCCTGGCTAGAAGCACAAGAAGAGGAAGAGGTAGGCTTTCCAGTCAGACCCCAGGTACCTTTGAGACCAATGACTTACAAGGCAGCTGTGGATATGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAGAGACAAGATATCCTTGATCTGTGGATCTATCACACACAAGGCTACTTCCCTGATTGGCAAAATTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGAGGGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCATTTTAGTCAGCGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGTAGAACCAGAGGAGATCTCTCGACGCAGGACTCGGCTTGCTGA +MK114856.1,gag,120,2022,789,2292,forward,1.871000000000001,MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC,MLHISSCFLPVLGLSGWTRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSGSNLVQPERPSSSGARTGT*KRK*NQRRSLDAGLGLLKRARQEAKGGDW*VRHF*LAEARRRKIGARASVLSRGELDR*EKIQLRPRRKKKYRLKHIV*ASKELERFAVNPGLLETSGGCKQILEQLQPSLQTRSEELRSLYNTVATLYYVHQKIDVKDTKEALDKVEEEQNKSKKKAQQAAADTRNRGQTSQNFPIVQNLQGQIVHQAISPRTLNA*VKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVSRHQAAMQMLKKVINEEAAE*DRLHPVHARPIAPGQIREPKRSDIARTTSTLQEQIR*MTHNPPIPVRKIYKR*IILGLNKIVKMYSPTSILDIKQRPKEPFRDYVDQFYKTLRAKQATQKVKN*MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC*KYRKERHQMKNCTKRQANFLKKIWPSHKGRPENFPQSRPEIPQSRPEPTAPPAPPEKSFKFEEATTPSQKQETIDKELYPLTSLRSLFGNDPSSQ*,ATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTGGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGTTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGGCTCAAATCTGGTCCAACCAGAGAGACCCAGTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGTAGAACCAGAGAAGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAAAGGCGGCGACTGGTGAGTACGCCATTTTTGACTAGCAGAGGCTAGAAGGAGAAAGATAGGTGCGAGAGCGTCAGTATTGAGCAGAGGAGAATTAGATAGATAGGAGAAAATTCAGTTAAGGCCAAGGAGAAAGAAAAAATATAGATTAAAACATATAGTATAGGCAAGCAAGGAACTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGGAGGCTGTAAACAGATATTAGAACAGCTACAACCATCCCTTCAGACAAGATCAGAAGAACTTAGATCATTATATAATACAGTAGCCACCCTCTATTATGTACATCAAAAGATAGATGTAAAAGACACCAAAGAAGCGTTAGACAAAGTAGAAGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCGGCAGCTGACACAAGAAACAGAGGCCAGACCAGTCAAAATTTCCCTATAGTGCAGAACCTACAAGGGCAAATAGTACATCAGGCCATATCACCTAGAACTTTAAATGCATAAGTAAAAGTAGTAGAAGAAAAAGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACTATGCTAAACACAGTAAGTAGACACCAAGCAGCTATGCAAATGTTAAAAAAGGTCATCAATGAAGAAGCTGCAGAATAAGATAGATTACATCCAGTGCATGCAAGGCCTATTGCACCAGGCCAGATAAGAGAACCAAAAAGAAGTGACATAGCAAGAACTACTAGTACCCTTCAGGAACAAATAAGATAGATGACACATAATCCACCTATCCCAGTAAGAAAGATTTATAAAAGATAAATAATTCTAGGACTAAATAAAATAGTAAAAATGTATAGCCCTACCAGCATTTTAGACATAAAGCAAAGGCCAAAAGAACCCTTTAGAGACTATGTAGACCAGTTCTATAAAACTTTAAGAGCCAAGCAAGCTACACAGAAAGTAAAAAATTAGATGACAAAAACCTTGTTAGTCCAGAATGCAAATCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAAAAAGTAAGAAGACCCGGCCATAAAGCAAAAGTTTTAGCTGAAGCAATGAGCCAAGCAACAGGTGCAGCCAACATAATGATGCAGAGAGGCAATTTTAAGAACCAAAGAAAGCCTGTTAAATGTTTCAATTGTGGCAAAGAAAAGCACATAGCCAAAAATTGCAAGGCCCCTAAGAAAAAAGGCTGTTAGAAATATAGAAAAGAAAGACACCAAATGAAAAATTGCACTAAGAGACAGGCTAATTTTTTAAAGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGAGAACTTTCCTCAAAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAAAGAGCTTCAAGTTTGAAGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATAGACAAGGAGCTGTATCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAA +MK114856.1,pol,1787,4892,2084,5096,forward,2.003988035892324,ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI,FFKENLAFPQRKARELSSKPTRNSSEQTRANSPTSPSRKELQV*RSNNSLSEAGDNRQGAVSSNFPQITLWQRPIVTIKIREQLKKALLNTGADDTVLEDIDLPRK*KPKMIRRIRSFIKVRQYEQVPIEISRHKAISTVLVGPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPRMDGPKVKQ*PLTEEKIKALVEICTEIEKEKKISKIRPENPYNTPVFAIKKKDGTK*KKLVDFRELNKKTQDF*EIQLSIPHPAKLKKKKSVTVLDVGDAYFSVPLDKDFKKYTAFTIPSINNETPKIRYQYNVLPQR*KRSPAIFQSSMTKILEPFRKTNPDIVIYQYIDDLYVRSDLEIRQHRTKVKELRQHLMR*RFTTPDKKHQKEPPFL*MRYELHPDKWTVQPIVLPEKES*TVNDIQKLVRKLN*ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI*RRTPKFRLPIQKET*ET*WTDYWQAT*IPK*EFVNTPPLVKL*YQLEKEPIIRAETFYVDKAANKDNKSRKARYVTDRRRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKKKVYLA*VPAHKRIKRNEQVNKLVSARIKKVLFLDKIEKAQEDHKKYHSN*RTMASNFNLPPIVAKEIVASCDKCQLKKEAMHRQVDCSPGIWQLDCTHLEEKIILVAVHVASRYIEAEVIPAETRQETAYFILKLARRWPVKTIHTDNGRNFTSNTVKAAC**AKIKQEFSIPYNPQSQEVVKSINNELKKIIRQVKDQAKHLKTAVQMAVFIHNFKRKGGIEGYSAEERIVDIIATEIQTKELQKQITKIQNFQVYYKDSRDPL*KGPAKLLWKGEKAVVIQDNSDIKVVPRRKAKIIKDYKKQMASDDCVASRQDED*NMEKFSKIPYVYFKESQEIGL*,TTTTTTAAAGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGAGAACTTTCCTCAAAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAAAGAGCTTCAAGTTTGAAGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATAGACAAGGAGCTGTATCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAAAGATAAGAGAGCAACTAAAGAAAGCTTTATTAAATACAGGAGCAGATGATACAGTATTAGAAGACATAGATTTGCCAAGAAAATAGAAACCAAAAATGATAAGAAGAATTAGAAGTTTTATCAAAGTAAGACAATATGAACAGGTACCCATAGAAATTAGCAGACACAAAGCTATAAGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTAGAAGAAATCTGTTGACTCAGCTTAGTTGCACTCTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAAGAATGGACGGCCCAAAAGTTAAACAATAGCCATTAACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATAGAAAAAGAAAAGAAAATTTCAAAAATTAGGCCTGAAAATCCATACAATACTCCAGTGTTTGCCATAAAGAAAAAAGATGGCACTAAATAGAAAAAATTAGTAGATTTCAGAGAACTTAATAAGAAAACTCAAGATTTCTAAGAAATTCAATTAAGTATACCACATCCTGCAAAGCTAAAAAAGAAAAAATCAGTCACAGTACTAGATGTAGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAAGAAATATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAAAGATTAGATATCAGTATAATGTGCTTCCACAAAGATAGAAAAGATCACCAGCAATATTCCAAAGTAGCATGACAAAGATCCTAGAGCCTTTTAGAAAGACAAATCCAGACATAGTTATCTATCAATACATAGATGATTTGTATGTAAGATCTGACTTAGAAATAAGGCAACATAGAACAAAAGTAAAGGAACTGAGGCAACATCTAATGAGGTAAAGATTTACCACACCAGACAAAAAGCACCAGAAAGAACCCCCATTCCTTTAGATGAGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTACTGCCAGAAAAAGAAAGTTAGACTGTCAATGACATACAGAAGTTAGTAAGAAAATTGAATTAGGCAAGTCAGATTTATGCAAAGATTAAAGTGAAGCAATTATGTAAGCTCCTTAAAAGAACCAAAGCATTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAAAGATTCTAAAAGATCCAGTACATAGAGCATATTATGACCCAGCAAAGGACTTAATAGCAGAACTACAGAAGCAAAGAGAAGGTCAGTGGACATATCAAATTTATCAAAAGCCATTTAAAAATCTAAAAACAGAGAAATATGCAAGAACGAAAGGTGCCCATACTAATGATGTAAAGCAATTAACAGAAGCAGTGCAAAAAATATCCACAGAAAGTATAGTAATATAAAGAAGGACTCCTAAATTTAGATTACCCATACAAAAAGAAACATAAGAAACATAGTGGACAGATTATTGGCAAGCCACCTAGATCCCTAAGTAAGAGTTTGTCAACACCCCTCCCTTAGTGAAATTATAGTACCAGTTAGAAAAAGAACCCATAATAAGAGCAGAAACCTTCTATGTAGATAAGGCAGCTAATAAAGATAATAAATCAAGAAAAGCAAGATATGTTACTGACAGAAGAAGACAAAAAGTTGTCACCATAAATGACACAACAAATCAGAAAACTGAATTACAAGCCATTCATCTAGCCTTGCAAGATTCAGGGCTAGAAGTAAACATAGTAACAGACTCACAGTATGCATTAAAGATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTAATAAAAAAGAAAAAAGTCTACCTGGCATAAGTGCCAGCCCACAAAAGAATTAAAAGAAATGAACAGGTAAATAAACTAGTCAGTGCTAGAATCAAGAAAGTACTATTTTTAGATAAAATAGAAAAAGCCCAAGAAGACCATAAAAAATATCACAGTAATTAAAGAACAATGGCTAGTAATTTTAACCTACCACCTATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAAAAGAAGCTATGCATAGGCAAGTAGACTGTAGTCCAGGTATATGGCAGCTAGATTGTACACATTTAGAAGAAAAAATTATCCTAGTAGCAGTTCATGTAGCCAGTAGATATATAGAAGCAGAAGTGATTCCAGCAGAGACAAGGCAAGAAACAGCATACTTTATTTTAAAACTAGCAAGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCCGCAATTTCACCAGTAATACAGTGAAGGCCGCCTGTTAGTAGGCAAAAATCAAGCAAGAATTTAGTATTCCCTACAATCCCCAAAGTCAAGAAGTAGTAAAATCTATAAATAATGAATTAAAGAAAATTATAAGACAAGTAAAAGATCAGGCTAAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGAAGGATACAGTGCAGAGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCAGGTTTATTACAAGGACAGCAGAGATCCACTTTAGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAAAGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAAGGATTATAAAAAACAGATGGCAAGTGATGATTGTGTGGCAAGTAGACAGGATGAAGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAGAAATAGGCTTATAG +MK114856.1,vif,4791,5349,5040,5619,forward,1.928125,MIVWQVDRMKIRTWKSLVKYHMYISKKAKK,MIVWQVDRMKIRTWKSLVKYHMYISKKAKK*AYRHHYETTHPRISSEVHIPLGGARLVITTY*GLHTGEKDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVRSLQYLALTALITPKKIKPPLPSVKKLTEDR*NKPQKTKGHRKSHTMNRH*,ATGATTGTGTGGCAAGTAGACAGGATGAAGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAGAAATAGGCTTATAGACACCATTACGAAACCACTCATCCAAGAATAAGTTCAGAAGTACATATCCCACTAGGAGGTGCTAGATTAGTAATAACAACATATTAAGGTCTGCATACAGGAGAAAAAGACTGGCATTTAGGCCAGGGAGTCTCCATAGAATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAAGTAAGATCTCTACAATACTTGGCACTAACAGCATTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAAGATAGATAGAACAAGCCCCAGAAGACCAAAGGCCACAGAAAGAGCCATACAATGAATAGACACTAG +MK114856.1,vpr,5033,5582,5558,5850,forward,2.052564102564103,MLFIHFRIKCHHSRIGIVLQRRARNRASRS,MEKKEI*HTSRP*LSRPSNSCALF*LFFRICYKKCHIRT*S*P*V*ISSRT*QSKISTILGTNSINNTKEDKATFA*CKETDRR*IEQAPEDQRPQKEPYNE*TLELLEELKREAVRHFPRPWLQNLRQYIYETYKDTWTRVEAIIRILQQMLFIHFRIKCHHSRIGIVLQRRARNRASRS*T,ATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAAGTAAGATCTCTACAATACTTGGCACTAACAGCATTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAAGATAGATAGAACAAGCCCCAGAAGACCAAAGGCCACAGAAAGAGCCATACAATGAATAGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAAACCTAAGACAATATATCTATGAAACTTATAAAGATACTTGGACAAGAGTAGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACT +MK114856.1,tat_exon1,5427,5775,5830,6045,forward,2.1097222222222225,MKLIKILGQE,MKLIKILGQE*KP**EFCNKCCLFISELSVTIAE*ALFCKEEQEIEPVDHRLEP*KHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,ATGAAACTTATAAAGATACTTGGACAAGAGTAGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACTAGAGCCCTAGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAG +MK114856.1,rev_exon1,5698,5776,5969,6045,forward,0.6923076923076923,MAGRSGDRDEDLLKTVRLIKFLYQSS,MAGRSGDRDEDLLKTVRLIKFLYQSS,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGT +MK114856.1,vpu,5790,6039,6061,6310,forward,1.3926829268292686,TIVGIKYKKILRQRKIDRIINRIRKRAEDSGNESEKDQEELSALVVEIRHDAP,MQPLKILAIVALVVAAIIAIVV*TIVGIKYKKILRQRKIDRIINRIRKRAEDSGNESEKDQEELSALVVEIRHDAP*DVDDL*,ATGCAACCTTTAAAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGACCATAGTAGGCATAAAATATAAGAAAATATTAAGACAAAGAAAAATAGATAGAATAATTAATAGAATAAGAAAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAAAAGATCAGGAAGAATTGTCAGCACTTGTAGTAGAAATAAGGCACGATGCTCCTTAAGATGTTGATGATCTGTAG +MK114856.1,env,5953,8557,6224,8795,forward,1.8896028037383144,MTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD,MRAKKIRKNCQHL**K*GTMLLKMLMICSAAENL*VTVYYEVPV*RDANTTLFCASDAKAYDTEVHNV*ATHACVPTDPNPHEVELKNVTENFNM*KNNMVDQMHEDIINL*DQSLKPCAKLTPLCVTLNCTDLKNNTVGNQTNYHLNETNTIQRKEMTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD*SDTLSKIVEKLKEKFRKNKTIIFKQSSREDIEIETHSFNCREEFFYCNTTRLFNST*SVNRTSINRTNNKNITLPCRIKQIINRWQEVRKAMYAPPISKIIRCSSNITGLILTRDSSTTNSKEETFRPRERNMKDN*RSELYKYKVVKIEPLKVAPTKAQRKVVQREKRAIRTLGAMFLRFLRTAGSTIGAASLTLTVQARQLLSGIVQQQNNLLKAIEAQQHMLQLTV*GIKQLQARVLSVERYLQDQQLLKI*SCSRKLICTTTVP*NTS*SNKSYSTI*DNMT*MQ*DREIQNYTKIIYNLLKESQIQQKKNEKELLELDQ*ANL*N*FSITKWL*YIKIFIMIVGGLVSLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRRPDRPERIEEEGEKRDRGRSRRLVTRFLPLI*DDLQSLCLFSYHHLKDLLLIVLKTVQILGHKK*EILKY**SLLQY*IQELKNSAVSLLNTIAIAVAERTDKVIEVRQKISRAFLHIPRKIRQGLEKALQ*NKWQVVKKLYG*,ATGAGAGCGAAAAAGATCAGGAAGAATTGTCAGCACTTGTAGTAGAAATAAGGCACGATGCTCCTTAAGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTAAGTCACAGTCTATTATGAGGTACCTGTGTAAAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTAGAAAAATAACATGGTAGACCAGATGCATGAGGATATAATCAATTTATGAGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAAAAATAATACTGTAGGAAATCAAACAAATTATCATCTCAATGAAACTAATACAATACAAAGAAAAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAATATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAAAGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTAGTTTTGCAATTCTAAAGTGTAAAGATGAGATGTTCAATAGAACAAGACCATGTAAGAATGTCAGCACAGTACAATGTACACATAGAATTAGACCAGTAGTGTCAACTCAACTGCTGTTAAATAGTAGCCTAGCAGAAAAAAAGATAGTACTTAGATCTGAAAATTTCACAGACAATACTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAAAGAGAGCAATTTATGCAACAAGACAGATAATAGAAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGAAGTGACACTTTAAGCAAAATAGTTGAAAAATTAAAGGAAAAATTTAGAAAAAATAAAACAATAATCTTTAAGCAATCATCAAGAGAGGACATAGAAATTGAAACGCACAGTTTTAATTGTAGAGAGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGAAGTGTTAATAGAACTAGCATAAACAGAACTAACAATAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATCAACAGGTGGCAGGAAGTAAGAAAAGCAATGTATGCCCCTCCTATCAGTAAGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATAGTAGTACAACTAATAGTAAAGAAGAGACCTTCAGACCTAGAGAAAGAAATATGAAGGACAATTAGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAAAAGTAGCACCCACCAAGGCACAAAGAAAAGTAGTGCAGAGAGAAAAAAGAGCAATAAGAACGTTAGGAGCTATGTTCCTCAGGTTCTTAAGAACAGCAGGAAGCACTATAGGCGCAGCGTCACTGACGCTGACAGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAAGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTAAGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTAGAAAGATACCTACAAGATCAACAGCTCCTGAAGATTTGAAGTTGCTCTAGAAAACTCATTTGCACCACTACTGTGCCTTAGAATACTAGTTAGAGCAATAAATCTTACAGTACCATCTAAGATAACATGACCTAGATGCAGTAGGACAGAGAAATTCAAAATTACACAAAGATAATATACAACTTACTTAAAGAATCGCAAATCCAACAGAAAAAGAATGAAAAAGAATTATTAGAACTAGATCAATGAGCAAATTTGTAGAATTAGTTTAGTATAACAAAATGGCTATAGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAAGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAAAGAACAGATAAAGTTATAGAAGTAAGACAAAAAATTAGCAGAGCTTTTCTCCACATACCTAGAAAGATAAGACAAGGCTTAGAAAAGGCTTTGCAATAAAATAAGTGGCAAGTAGTCAAAAAGTTGTATGGCTAG +MK114856.1,tat_exon2,8102,8198,8376,8469,forward,0.8,RPSSQPQEDQTGPKE,RPSSQPQEDQTGPKE*KKKVKRETEADPED**,AGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGA +MK114856.1,rev_exon2,8103,8379,8377,8653,forward,1.3725274725274725,ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE,DPPPNPKKTRQARKNRRRR*KERQRQIQKISD*ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE*,GACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAG +MK114856.1,nef,8549,9176,8796,9417,forward,2.0414634146341464,MSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MAR*PAVKERIERVNPRPAAKKEQAEPAAAKVRAASRDLEKYRAITSSNTSTTNAACA*LEAQEEEEVGFPVRPQVPLRPMTYKAALNLSHFLKEKGGLEGLI*SQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRNPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGGCTAGATAGCCTGCTGTAAAAGAAAGAATAGAAAGAGTTAATCCAAGGCCTGCTGCAAAGAAAGAACAAGCTGAGCCAGCAGCAGCTAAGGTAAGAGCAGCATCTCGAGACTTAGAAAAATATAGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTAGCTAGAAGCACAAGAGGAAGAAGAAGTAGGCTTTCCAGTCAGACCTCAAGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTAAATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTAGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGAAATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATAGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA +MK115009.1,gag,302,1715,789,2292,forward,1.8444000000000005,MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC,MGARASVLSGGKLDR*EKIYLRPEGKKKYRLKHIV*ASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQIVHQPLSPRTLNA*VKVIEEKAFSPEVIPMFSALSERATPQDLNTMLNTVRGHQAAMQMLKETINDEAAE*DRLHPVHAGPIAPGQMKEPRGSDIAGTTSTLQEQIR*MTHNPPIPVGEIYKRWIILRLNKIVRMYSPVSILDIRQRPKEPFKDYVDRFYKTLKAEQASQDVKN*MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC*KCRKERHQMKDCTKRPD*DG*FFKEDLAFPQGKAREFSPEQTRANSPASRELQV*,ATGGGTGCTAGAGCGTCAGTATTAAGCGGCGGAAAATTAGATAGATAGGAAAAAATTTACCTAAGGCCAGAAGGAAAGAAAAAATATAGATTAAAACATATAGTATAGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTAGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGCGTACATCAAAGGATAAATGTAAAAGACACCAAGGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATAGTACATCAACCATTATCACCTAGAACTTTAAATGCATAGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAAGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGAGAGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAGGCTGCAGAATAGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAAAGAACCAAGAGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAAGATAGATGACACATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTAAGGCTAAACAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAAGACCAAAAGAACCCTTTAAAGATTATGTAGACCGATTCTATAAAACTCTAAAGGCTGAGCAAGCGTCACAGGATGTAAAAAATTAGATGACAGAAACCTTGTTAGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTAAGAGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAGTCAGCCTCCATAATAGTGCAAGGAGGCAATTTTAAGAACCAAAGAAAGAATGTTAAGTGTTTCAATTGTGGCAAAGAAAGACACACAGCCAAAAATTGCAGGGCCCCTAAGAAAAAAGGCTGTTAAAAATGTAGAAAGGAAAGACACCAAATGAAAGATTGTACTAAGAGACCAGACTAAGACGGCTAATTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGA +MK115009.1,pol,1613,4703,2084,5096,forward,1.89531405782652,AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED,FFKEDLAFPQGKAREFSPEQTRANSPASRELQV*GRGNSSSSEAGDERPRTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEINLPGK*KPKMIKRIRSFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKSGIDSPRVKQWPLTEEKIKALIEICAEIEKEKKITKIRPENPYNTPVFAIKKKDSTK*KKLVDFRELNKRTQDF*EVQLRIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPEVKYQYNVLPQR*KRSPAIFQSSMTKILEPFRKENPDIVIYQYIDDLYVRSDLEIEQHRTKIEELRQHLLR*GLTTPDKKHQKKPPFL*ISYELHPDK*TVQPIQLPDKDS*TVNDIQKLVRKLN*ASQIYPEIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQRRDQ*TYQIYQEPFKNLKTEKYARTRGAHTNDVKQLTEAVQKIALEAIVI*RKTPKFKLPIQKET*KMWWTKYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVRAETFYVNKAANRKTKLRKAEYVTDRRRQKVVSLIDTTNQRTKLHAIHLALQDSGSTVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKEKIYLA*VPAHKRIEGNEQVDKLVSNRIRRVLFLDRIDKAQEEHEKYHSN*RAMASNFNLPPVVAKEIVASCDKCQLKGEPMHRQVDCSPGIWQLDCTHLERKIILVAVHVASRYIEAEVIAAETGQETAYFILKLAGR*PVKIIHTDNGSNFTSTTVKAAC**AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED*NIEQFSKTPYAYFKESSEIGLQTSL*,TTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGAGGAAGAGGCAACAGCTCCTCCTCAGAAGCAGGAGACGAAAGACCAAGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATAAATTTGCCAGGAAAATAGAAACCAAAAATGATAAAAAGAATTAGAAGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACGCCAGTCAACATAATTAGAAGAAATCTGTTGACCCAGCTTAGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGTCAGGAATAGATAGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATAGAAAAGGAAAAGAAAATTACAAAAATTAGGCCTGAGAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGAAAAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTAAGAAGTTCAACTAAGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTAGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGAAGTTAAATATCAGTACAATGTGCTTCCACAGAGATAGAAAAGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATAGATGATTTGTATGTAAGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAAGAACTGAGACAACATCTGTTAAGGTGAGGACTCACCACACCAGACAAGAAACATCAGAAAAAACCTCCATTTCTTTAGATAAGTTATGAACTCCATCCTGATAAATAGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTAGACTGTCAATGACATACAGAAGTTAGTAAGAAAGTTGAATTAGGCAAGCCAGATCTATCCAGAGATTAAAGTAAAGCAATTATGTAAACTCCTTAGAGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAGAGATTCTAAAAGAACCAGTACATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGAGGAGAGACCAATAGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGAGAAATATGCAAGAACGAGAGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGAAGAAAGACTCCTAAATTTAAACTACCTATACAAAAAGAAACATAGAAAATGTGGTGGACAAAGTATTGGCAAGCCACCTAGATTCCTGAGTAAGAATTTGTCAATACCCCTCCCTTAGTAAAACTATAGTACCAGTTAGAGAAAGAACCCATAGTAAGAGCAGAAACTTTCTATGTAAATAAGGCAGCTAATAGAAAGACTAAATTAAGAAAAGCAGAGTATGTTACGGACAGAAGAAGACAAAAGGTTGTCTCCCTAATAGACACAACAAATCAGAGGACTAAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAAAGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAAGAAAAGATTTACCTGGCATAAGTCCCAGCACACAAAAGAATTGAAGGAAATGAACAAGTAGATAAATTAGTCAGTAATAGAATCAGAAGAGTACTATTTCTAGATAGAATAGATAAAGCCCAAGAAGAACATGAAAAATATCACAGTAATTAGAGAGCAATGGCTAGTAATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATAGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAAGAAAAATTATCCTAGTAGCAGTTCATGTAGCCAGTAGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATAGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACAGTTAAAGCCGCCTGTTAGTAGGCAGAGATCAAGCAGGAATTTAGTATTCCCTACAATCCTCAAAGTCAAAGAGTAGTAAAATCTATGAATAATAAATTAAAGAAAATTATAGGACAGGTAAAAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCATAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCAGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGAGATTATAGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATAGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATAGGTTTACAGACATCACTATGA +MK115009.1,vif,4590,5148,5040,5619,forward,2.064583333333333,MIVWQVDRMRIRT,MIVWQVDRMRIRT*NSLVKHHMHISKKAQR*VYRHHYESHNPKTSSEVHIPLEEARLVIKTY*GLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKRSHTINGH*,ATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATAGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATAGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGAGGAAGCAAGATTGGTAATAAAAACATATTAAGGTCTGCATACAGGAGAAAGAGACTGGCATTTAGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATAAATGGACATTAG +MK115009.1,vpr,5087,5381,5558,5850,forward,1.0679487179487188,MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT,MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT*AEVEAIIRTLQQLLFIHFRIRCQHSRIGIIRQRRARNRASRS*L,ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATAAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGCTT +MK115009.1,tat_exon1,5412,5574,5830,6045,forward,1.0958333333333334,MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ,MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ,ATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAACAAAAAGCTTAGGCATCTCCTATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAG +MK115009.1,rev_exon1,5497,5575,5969,6045,forward,0.7692307692307692,MAGRSRDSDEELLTAVRIIKRLYQSS,MAGRSRDSDEELLTAVRIIKRLYQSS,ATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT +MK115009.1,vpu,5589,5835,6061,6310,forward,0.9975609756097563,MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP,MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP*DSNDM*,ATGCATGCCTTAGAAATAGCAGCAATAGCAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAAGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGACGAGGACCAAGAGGAATTATCCGCACTTGTGGAGATGAGGCATCTTGTTCCTTAAGATAGTAATGATATGTAG +MK115009.1,env,5752,8353,6224,8795,forward,1.878154205607472,MKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD,MRVTRTKRNYPHLWR*GILFLKIVMICSANNL*VTVYYKVPV*KEATTTLFCASDAKAYETEKHNV*ATHACVPTDPSPQEVALENVTETFNM*KNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDNLNLTCPNNNTCSNNTNYNMKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD*NDTLKQIVIKLKEKFKNKTIVFTQSSGEDPEIVMHSFNCREEFFYCNTTQLFNST*NNST*NSTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQRQIRCSSNITGLLLVRDGRSNNSSNDTETFRPRGRDMKDN*RSKLYKYKVVKIKPLRIAPTHAKRRVVQKEKRAIRLEAFFLRFLRAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQAKVLALERYLKDQQLLRI*SCSGKLICTTNVPWNISWSPRWNRSLDKI*TNMT*KQ*EKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQ*L*YIKIFIIIVRGLISLRIVFTILSIVNKVRQGYSPLSLQTLLPTQRGPDRPERTEERGRKKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLKDLLLIAARIVELLGRRK*EALKY**NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL*,ATGAGAGTGACGAGGACCAAGAGGAATTATCCGCACTTGTGGAGATGAGGCATCTTGTTCCTTAAGATAGTAATGATATGTAGTGCCAACAACTTGTAGGTCACAGTCTATTATAAAGTACCTGTATAGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTAGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTAGAAAATGTGACAGAAACATTTAACATGTAGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATAGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAACTTGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATGAAAGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAAGGTGACAAAAGAACATGCACTTTTCTATAAACTTAATGTAGTACCAATAGATGAAGATAGTAAAAATACTACGGGCAAATATAAGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTAAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATAGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATAGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTAAACGGCAGTCTAGCAGAAGAAAAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATAGAACAGACATAATAAGAGATATAAGACAAGCGCATTATAACATTAGTAAGAAAGATTAGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTAAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGAAGACCCAGAGATAGTGATGCATAGTTTTAATTGTAGAGAGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTAGAATAATAGTACTTAGAATAGTACTGATAATTAGAATAGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAAGAAGAGCAATGTATGCCCCTCCCATCCAAAGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTAGGAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTAGAGGAAGAGATATGAAGGACAATTAGAGAAGTAAATTATATAAATATAAAGTAGTCAAAATTAAACCATTAAGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAAGGAAAAAAGAGCAATAAGACTTGAAGCTTTCTTCCTTAGGTTCTTAAGAGCAGCAGGAAGCACTATAGGCGCAGCGTCAGTGACGCTGACAGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTAAGGCATCAAGCAGCTCCAGGCAAAAGTCCTGGCTTTAGAAAGATACCTAAAAGATCAACAGCTCCTAAGGATTTAAAGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATAAGATTTAGACTAACATGACCTAGAAGCAGTAAGAAAAAGAAATTGACAATTACACAGACATAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTAGGCAAGTTTGTAAAATTAGTTTGACATTACACAGTAGCTATAGTATATAAAAATATTCATAATAATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGAGGACAGATAAAATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAA +MK115009.1,tat_exon2,7934,8027,8376,8469,forward,0.6866666666666661,RPSSQPREDPTGPKEQKKEVERKTEAHPRD,RPSSQPREDPTGPKEQKKEVERKTEAHPRD*,AGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAG +MK115009.1,rev_exon2,7935,8211,8377,8653,forward,1.3065934065934066,ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE,DPPPNPERTRQARKNRRKR*KERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAG +MK115009.1,nef,8609,8996,8796,9417,forward,1.6390243902439028,MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR,MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR*CFKLVPVDPDKVEEASVRENNCLLSPENLHRMEDEHREVLQWRFDSRLAFHHIARELHPEYYKDC*,ATGACTTACAAGAGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAAGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTAGATAGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAAGTAGAAGAGGCCAGTGTAAGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATAGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACATAGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA +MK115387.1,gag,292,1795,789,2292,forward,0.20799999999999996,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCTGTATTAAGCGGGGGAGAATTAGATAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAGAAAAGATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCCGGCCTTTTAGAAACAACAGAGGGATGTAAACAAATACTGGAACAGCTGCAACCATCCCTTCCGACAGGATCAGAAGAACTTAGATCATTATTTAATACAGTAGCAACCCTCTATTGTGTGCATAAGAGAATAGAGGTACAAGACACCAAGGAAGCCTTAGAAAAGATAGAAGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAGGCAGTAGCTGACACAGGAAGTACCAGCCAGGTCAGCCAAAATTACCCGATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGGCCATATCGCCTAGAACTTTAAATGCATGGGTGAAAGTAGTAGAAGAGAAGGCCTTTAGCCCAGAGGTAATACCCATGTTTTCAGCATTATCGGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAGGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTGTTGCACCAGGCCAAATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAAGAACAAATAGCATGGATGACAAGTAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAGATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAGTCCTAAGAGCCGAGCAAGCATCGCAGGATGTAAAAAATTGGATGACAGAAACCTTATTGGTCCAAAATGCAAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCAGCAGCAACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAAATATCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGACTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTCCAAGGGAAGGCCAGGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAGGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MK115387.1,pol,1587,4599,2084,5096,forward,0.13160518444665992,FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCTCCAAGGGAAGGCCAGGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAGGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGAGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGACACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCTATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGCAGAAATTTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTACAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAAGAAGGGAAGATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGGGAACTTAATAAAAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAGAAATCAATAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAATAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGATAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGACATAGTTATCTATCAATACATGGATGACTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACACTTGTTGAAGTGGGGATTGACCACACCAGATAAAAAACATCAGAAAGAACCCCCATTCCTGTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGACAAAGATAGCTGGACTGTCAATGACATACAGAAGCTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTGAGACAATTATGTAAACTCCTTAAGGGAGCCAAAGCGCTAACAGAAGTGATACAACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAGTTACAGAAGCAGGGGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAACGAGGGGTACCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTGATATGGGGAAAGACCCCTAGATTTAAACTACCCATACAGAAAGAAACATGGGATACCTGGTGGACAGAATATTGGCAAGCCACCTGGATTCCCGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAAAAAGAACCTATTGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAGCAGAGGAAGACAAAAGGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAACTGCAAGCAATTTGTCTAGCATTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCACTAGGAATAATTCAAGCACAACCAGATAGGAGTGAATCAGAGATAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAGGGTCTACCTTGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTCCTATTTTTGGATGGAATAGATAAGGCCCAAGAGGAGCATGAGAAATATCACAATAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGTTGTGATAAATGCCAGCTAAAGGGAGAAGCCACGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTCCTCTTAAAATTAGCAGGAAGGTGGCCAGTGAAAGCAATACATACAGACAATGGAACCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATGTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAAGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTCCAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAACAGAGATCCACTTTGGAAAGGACCAGCAAAACTTCTTTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115387.1,vif,4543,5122,5040,5619,forward,0.3041666666666665,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGCACATGGAAAAGTTTAGTAAAACACCATATGTACATTTCAAAGAAAGCCCAGGGATGGTTTTATAGACATCACTATGAAAATCCTCATCCAAGAATAAGTTCAGAAGTACACATCCCGCTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGCAGGGAAAGGAAATATAGCACACAAGTAACCCCTGACCTAGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTGCAGAATCTGCTATAAGAGAGGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAACAGCATTAGTAACACCAAAAAAGACAAAGCCACCTTTGCCTAGTGTGACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCAAACAATGAATGGACACTAG +MK115387.1,vpr,5061,5355,5558,5850,forward,0.4038461538461544,MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS,MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*I,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTGGGACAACATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGATT +MK115387.1,tat_exon1,5332,5551,5830,6045,forward,0.41666666666666674,MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ,MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ*,ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAAATGCTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGA +MK115387.1,rev_exon1,5471,5552,5969,6045,forward,0.6346153846153846,MAGRSGDSDEDLLKTVRLIKYLYQSSE,MAGRSGDSDEDLLKTVRLIKYLYQSSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGAG +MK115387.1,vpu,5563,5809,6061,6310,forward,0.7682926829268295,MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL,MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL*,ATGCAATCCTTATATATATTAACAATAGTAGCATTAGTAGTAGCAGCAATATTAGCAATAGTTGTGTGGGCCATAGTACTCATAGAATATAAGAAAATATTAAAACAAAGGAGAATAGATAGGTTAATTGATAGAATAATAGATAGGGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAG +MK115387.1,env,5726,8288,6224,8795,forward,0.6280373831775696,MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL,MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL*,ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTAATAGGAAATGTAACAGAAGATTTTAACATGTGGAAGAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGTCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGTACTGATATTAGGAATAGTACCGTTACTTCTAATACTACTACTTGGGGAGAAATGACAAACTGCACTTTCAATATCACCACAAGCATAAAGGATAAGATGAAAAAAGAAGCGGCACTTTTTTATAAAATTGATTTAGTAGAAATAGATGAAGAGAAAAATAACAGTAGTACCAGATATAGGTTGATAAATTGTAACACCTCAGCCATTACACAAGCCTGCCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCAATTCTAAAGTGTAATAATAAGAAGTTCAGTGGAAAGGGACCATGTACAAATGTCAGCACAGTGCAATGTACACATGGAATTAAGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAATGATTAGATCTGACAATATCACAGACAATACTAAAAACATAATAGTACAGTTGAAGGAAGCCATACAAATTTTCTGTATAAGACCCAACAACAATACAAGAAAAAGTATAAATATAGGACCAGGGAGAGCATTTTACACAACAGGAGATATAATAGGAGACATAAGGCAAGCACATTGTAACATTAGTGGAAATTGGAATAACACTTTAAAACAGATAGCTACACAATTAGGAAAACAACTGAATCAAACACAACAAATAATCTTTAATTCATCCGCAGGAGGGGACCCAGAGATTGTAACACACAGTTTTAATTGTGGAGGGGAATTCTTCTATTGTAATTCATCATCACTGTTTAATAGTACCTGGACTAAAAATGGTACTGGTAGTTGGCAGTCTAATGATACTCAGAATGGTAATATCACACTCCAATGCAGAATAAAACAAATTATAAACCTGTGGCAGGGAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAACTGTACATCAAATATTACAGGGCTGGTTTTAACAAGAGATGGGGGGAAGGTGATTAATGAAACTGAGACCTTTAGACCTGGAGGAGGAAATATGAAGGATAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAAAGAGAGAAAAGAGCAGTAGGACTGGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCCGGAAGCACTATGGGCGCAGCGTCAATAGCGCTGACGGAACAGGCCAGACGAGTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATTTGTTGCAACTCACAGTCTGGGGCATTAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTAGGACTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATCGTAGTTGGGGTGGGCATAACAAAAATCTAGATGACATTTGGGGTAACATGACCTGGATGGAGTGGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTACAGAATCACATTCCCAACAAGAAAAGAATGAACAAGAATTATTGGCATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAGGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTGGGACGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAGGGACAGATAGGATAATAGAAATATTACAAAGAATTGGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +MK115387.1,tat_exon2,7869,7965,8376,8469,forward,0.6000000000000001,RPSSQLRGEPTGPKE,RPSSQLRGEPTGPKE*KKEVERETKADPVD**,AGACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGA +MK115387.1,rev_exon2,7870,8146,8377,8653,forward,0.29670329670329676,DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE,DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE*,GACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTGGGACGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAATAG +MK115387.1,nef,8289,8940,8796,9417,forward,0.5162601626016183,MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC,MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTAGGGTTGGATGGAATGCAGTGAGGGAAAGAATGAGACGAGCTCAGCCAACAGCAGATAGGGAACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTAGAGACCTGGAAAAATATGGAGCACTTACAAGTAGGAATACAGCAGCTACTAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGATGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGACCCATGACTTATAAAGCAGCTCTAGATCTGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAGTTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTATTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCACTTGAGCCAGATCAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCCTGTTACACCCTCTGAGCCAGCATGGGATGGATGACCCGGAGAAAGAAGTGCTAGTGTGGAGGTTTGACAGCCGCCTCGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAAGACTGCTGA +MK115491.1,gag,521,2027,789,2292,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115491.1,pol,1813,4825,2084,5096,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115491.1,vif,4769,5348,5040,5619,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115491.1,vpr,5287,5581,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115491.1,tat_exon1,5558,5777,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115491.1,rev_exon1,5697,5775,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115491.1,vpu,5789,6035,6061,6310,forward,0.6865853658536587,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115491.1,env,5952,8493,6224,8795,forward,0.49135514018691584,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115491.1,tat_exon2,8074,8170,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115491.1,rev_exon2,8075,8360,8377,8653,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115491.1,nef,8494,9115,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK116110.1,gag,0,1557,140,1643,forward,2.1186000000000007,MVFISCGVAPSANAENIGITSGLKAFSSTTFTHAFKVLGDMA,PESESRTREVLSTQDSAC*ALWPGPPTP*HAVIISSSVAAGPNAFKIVLQSGFAFWTNKVSVIQFFTSCEACSALRVL*NRST*SLKGSFGPCFMSKMLTGLYILTILFNPRITHLL*ISPTGIGGLFVIHPICS*RVLVVPAISLPLGSLIWPGATGPACTGCNLSHSAASSLMVSFNICIAA*CPPTVFSMVFISCGVAPSANAENIGITSGLKAFSSTTFTHAFKVLGDMA*CTICPWRFCTIG*FWLTWLLFPAPAAACCAFILLLFCSSSILSSAPLVSCISIL*CIQ*RTATVLYNDLSSSDPVWRDGCSCPSICLQPSDVSNRPGLTANRSSSLLAHTRCFNLYFFFPPGLNRIFSHWSNFPPLNTDALAPISLLLASAR*KLFWRTHQSPKQ*AK*IQLP**CRKAILGTKRRLLSVSTVVK*GI*QKIAGPPGERAVGNVDRKDTR*KIVVRDRLIF*GNSGLPTRGGQGISFRADQSQQPHQRRASGLGKRQQLPLRSRSR*TGNYIP*,CCTGAAAGCGAAAGTAGAACCAGAGAAGTTCTCTCGACGCAGGACTCGGCTTGCTGAGCTTTATGGCCGGGTCCCCCCACTCCCTGACATGCTGTCATCATTTCTTCTAGTGTAGCTGCTGGTCCCAATGCTTTTAAAATAGTCTTACAATCTGGGTTTGCATTTTGGACCAACAAGGTTTCTGTCATCCAATTTTTTACATCCTGTGAAGCTTGCTCGGCTCTTAGGGTTTTATAGAACCGGTCTACATAGTCTCTAAAGGGTTCCTTTGGTCCTTGTTTTATGTCCAAAATGCTGACAGGACTATACATTCTTACTATTTTATTTAATCCCAGGATTACCCATCTTTTATAGATATCTCCTACTGGGATAGGTGGATTATTTGTCATCCATCCTATTTGTTCCTGAAGGGTACTAGTAGTTCCTGCTATATCACTTCCCCTTGGTTCTCTCATTTGGCCTGGTGCAACAGGCCCTGCATGCACTGGATGCAATCTATCCCATTCTGCAGCTTCCTCATTGATGGTCTCTTTTAATATTTGCATTGCTGCTTGATGTCCCCCCACTGTATTTAGCATGGTGTTTATATCTTGTGGGGTGGCTCCTTCTGCTAATGCTGAAAACATAGGTATTACTTCTGGGCTAAAAGCCTTTTCTTCTACTACTTTTACCCATGCATTTAAAGTTCTAGGTGACATGGCCTGATGTACCATTTGCCCCTGGAGGTTTTGCACTATAGGGTAGTTTTGGCTGACCTGGCTGTTATTTCCTGCGCCAGCTGCTGCTTGCTGTGCTTTCATCTTGCTTTTGTTTTGCTCTTCCTCTATCTTATCTAGCGCTCCCTTGGTGTCTTGTATCTCTATCCTTTGATGTATACAATAGAGGACCGCTACTGTATTATATAATGATTTAAGCTCTTCTGACCCTGTTTGGAGGGATGGCTGTAGCTGTCCCAGTATTTGTCTACAGCCTTCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGCTCCCTGCTTGCCCATACTAGATGTTTTAACCTATATTTTTTCTTTCCTCCTGGCCTTAACCGAATTTTTTCCCATTGGTCTAATTTTCCCCCGCTTAATACTGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGGTAAAAACTTTTTTGGCGTACTCACCAGTCGCCGAAGCAATGAGCCAAGTAAATTCAACTACCGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAAGAAGACTGTTAAGTGTTTCAACTGTGGTAAAATAGGGCATATAGCAAAAAATTGCAGGGCCCCCAGGAGAAAGGGCTGTTGGAAATGTGGACAGGAAGGACACCAGATGAAAGATTGTAGTGAGAGACAGGCTAATTTTTTAGGGAAACTCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAAGAGACAGCAACTCCCCCTCAGAAGCAGGAGCCGATAGACAGGGAACTATATTCCTTAG +MK116110.1,pol,1393,4405,1435,4447,forward,0.19680957128614174,FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED,FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED*,TTTTTTAGGGAAACTCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAAGAGACAGCAACTCCCCCTCAGAAGCAGGAGCCGATAGACAGGGAACTATATTCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCTCAATAAAAGTAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGTGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAATATGATCAGATACCCATAGAAATCTATGGACATAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATTTGTTGACTCAGATTGGGTGCACTTTAAATTTTCCCATTAGTCCTATCGAAACTGTACCAGTAAGATTAAAGCCAGGAATGGATGGCCCAAAAATTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAGATTTCAAAGATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGGGAACTTAATAAGAGAACTCAAGATTTCTGGGAAGTTCAATTGGGAATACCGCATCCCGCAGGATTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCATTAGATAAAGACTTTAGGAAGTATACTGCATTTACCATACCCAGTGTAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAGCTAGCATGACAAAAATTTTAGAGCCTTTTAGGAAGCAAAATCCAGACATGGTTATTTATCAATACATGGATGATCTATATATAGGATCTGACTTGGAATTAGGACAGCATAGGACAAAAATAGAGGAACTGAGACAACATCTATTGAGGTGGGGGTTTACCACACCAGACAAGAAGCATCAGAAAGAACCTCCATTCCTCTGGATGGGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAACACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTAGGAAAATTAAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTAAGGCAGTTATGTAAACTCCTTAGAGGAACCAAATCACTAACAGAAGTAGTACCACTAACAAGAGAGGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCGGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAATTACAAAAGCAGGGACAAGGCCAGTGGACTTATCAGATTTATCAAGAACCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAATAAAGGGTACCCACACTAATGATGTAAAACAATTAACACAGGCTGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATCCCTGAGTGGGAGTTTGTTAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGACCCCATAGTAGGAGCAGAAACATTCTATGTCGATGGGGCAGCCAATAGGGATACTAAATTAGGAAAAGCAGGATATGTTACTGACAGGGGAAGACAAAAAATTGTCCCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTTACCTAGCTCTGCAGGATTCAGGATCAGAAGTAAACATAGTATCAGACTCACAGTATGCAATAGGAATTCTTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGACATGGGTGCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTATTATTCTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCCATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGTTAAAAGGAGAAGCCATACATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTGGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTGGCCAGTGGATATATTGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATATTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAACACAATACATACAGACAATGGCAGCAACTTCACTAGCACTGCGGTTAAAGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGGGATCAAGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGAGGTACAGTGCAGGGGAAAGAATAGTAGACATGATAGCATCAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAACAGTGAAATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGACTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAGGTAGACAGGATGAGGATTAA +MK116110.1,vif,4349,4928,4391,4970,forward,0.546875,MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH,MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAGGTAGACAGGATGAGGATTAATGCATGGAAAAGCTTAGTAAAGCACCATATGCATGTTTCAAGGAAAGTTGAGAGATGGGTTTATAAACATCACTATGAAAGTACTAATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTAAAAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGAAAAAAGAGCTATAATACACAAGTAGACCCTGAAGTAGCAGACCAACTAATCCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAAAGCCATAGTAGGACATAGAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCCCTACAGTACTTGGCATTAGCAGCATTAGTAAAATCAAAAAAGACAAAGCCACCTTTGCCTAGCGTTACGAAGCTGACGGAGGATAGATGGAACAAGCCCCAGAGGACCAAGGGCCGCAGAGGGAACCATATAATGAATGGGCACTAG +MK116110.1,vpr,4867,5158,4909,5200,forward,0.48333333333333317,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPRIWLQSLGQYVYETYGDTWTGVEAIIRILQQMLFIHFRIGCQHSRIGIIRRGRTRNGASRP,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPRIWLQSLGQYVYETYGDTWTGVEAIIRILQQMLFIHFRIGCQHSRIGIIRRGRTRNGASRP*,ATGGAACAAGCCCCAGAGGACCAAGGGCCGCAGAGGGAACCATATAATGAATGGGCACTAGAGCTTTTAGAGGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGGATATGGCTTCAGAGCTTAGGACAATACGTCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTTTGCAACAAATGCTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATTCGACGAGGGAGAACAAGAAATGGAGCCAGTAGACCCTAG +MK116110.1,tat_exon1,5138,5357,5180,5395,forward,0.6111111111111112,MEPVDPSLAPWKHPGSQPKTACTNCYCKKCCLHCQVCFTKKGLGISYGRKKRRQRRRPPQSSKAHQNPLPKQ,MEPVDPSLAPWKHPGSQPKTACTNCYCKKCCLHCQVCFTKKGLGISYGRKKRRQRRRPPQSSKAHQNPLPKQ*,ATGGAGCCAGTAGACCCTAGCCTAGCGCCCTGGAAGCACCCAGGAAGTCAGCCTAAGACTGCTTGTACCAATTGCTATTGTAAAAAGTGCTGCTTACATTGCCAAGTTTGTTTCACAAAAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAGCAGTAAGGCTCATCAAAATCCTCTACCAAAGCAGTAA +MK116110.1,rev_exon1,5277,5355,5319,5395,forward,0.5769230769230769,MAGRSGDSDEDLLKAVRLIKILYQSS,MAGRSGDSDEDLLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAGCAGTAAGGCTCATCAAAATCCTCTACCAAAGCAGT +MK116110.1,vpu,5369,5615,5411,5657,forward,0.48124999999999996,MQSLQIGAIVALVVGTIIAIVVWSIVLIEYRKILRQKKIDRIIDRIVERAEDSGNESEGDQEELSALVERGHDAPWNVNDL,MQSLQIGAIVALVVGTIIAIVVWSIVLIEYRKILRQKKIDRIIDRIVERAEDSGNESEGDQEELSALVERGHDAPWNVNDL*,ATGCAATCTTTGCAAATAGGAGCAATAGTAGCATTAGTAGTAGGAACAATAATAGCAATAGTTGTGTGGTCTATAGTACTCATAGAATATAGGAAAATATTAAGACAAAAGAAAATAGATAGAATAATAGATAGAATAGTAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGACCAGGAAGAGTTATCAGCACTGGTGGAAAGGGGGCATGATGCTCCTTGGAATGTTAATGATCTGTAG +MK116110.1,env,5532,8073,5574,8124,forward,0.5259128386336873,MRVKETRKSYQHWWKGGMMLLGMLMICSAATNLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVLLGNVTEDFNAWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILHCTDVNNTRNGMTGELKNCSFNITTKITNKVQKEYALFYKLDVVPINNKDNDTSFNNNSYRLISCNTSVITQACPKVSFEPIPIHYCTPAGYAILRCNNETFSGKGPCTNVSSIQCTHGIRPVVSTQLLLNGSLAKQEVVIRSQNFSDNVKTIIVQLKTPVKINCTRPNNNTRKSIHAGPGKVIYATGEIIGDIRQAHCNISAAEWNDTLGQIVTKLQEQFGNKTIVFNQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWNNNGTNTWNSTGNITLPCKIRQIVNMWQKVGKAMYAPPIRGQIKCSSNITGLLLTRDGGNESESETFRPGGGDMRDNWRSELYKYKVVRIEPLGLAPTKAKRRVVQREKRAIGTLGAVFLGFLGTAGSTMGAASMTLTVQARQLLSGIVQQQNNLLKAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNASWSNKSLNEIWDNMTWMEWEKEISNYTQLIYTLIEESQSQQEKNEQELLALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEDGGERDRDRSTRLVTGFLPLFWDDLRSLCLFSYHRLRDLLLIAARIVELLGHRGWEILKHWWSLLQYWSQELKKSAVSLLNATAIAVAEGTDRIIEVVQRACRAILHIPVRLRQGLERALL,MRVKETRKSYQHWWKGGMMLLGMLMICSAATNLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVLLGNVTEDFNAWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILHCTDVNNTRNGMTGELKNCSFNITTKITNKVQKEYALFYKLDVVPINNKDNDTSFNNNSYRLISCNTSVITQACPKVSFEPIPIHYCTPAGYAILRCNNETFSGKGPCTNVSSIQCTHGIRPVVSTQLLLNGSLAKQEVVIRSQNFSDNVKTIIVQLKTPVKINCTRPNNNTRKSIHAGPGKVIYATGEIIGDIRQAHCNISAAEWNDTLGQIVTKLQEQFGNKTIVFNQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWNNNGTNTWNSTGNITLPCKIRQIVNMWQKVGKAMYAPPIRGQIKCSSNITGLLLTRDGGNESESETFRPGGGDMRDNWRSELYKYKVVRIEPLGLAPTKAKRRVVQREKRAIGTLGAVFLGFLGTAGSTMGAASMTLTVQARQLLSGIVQQQNNLLKAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNASWSNKSLNEIWDNMTWMEWEKEISNYTQLIYTLIEESQSQQEKNEQELLALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEDGGERDRDRSTRLVTGFLPLFWDDLRSLCLFSYHRLRDLLLIAARIVELLGHRGWEILKHWWSLLQYWSQELKKSAVSLLNATAIAVAEGTDRIIEVVQRACRAILHIPVRLRQGLERALL*,ATGAGAGTGAAGGAGACCAGGAAGAGTTATCAGCACTGGTGGAAAGGGGGCATGATGCTCCTTGGAATGTTAATGATCTGTAGTGCTGCAACAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACGCATGCCTGTGTACCCACGGACCCCAACCCACAAGAAGTATTATTGGGAAATGTGACAGAAGATTTTAATGCATGGAAAAATAACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAATTAACCCCACTTTGTGTTATTTTGCATTGCACTGATGTCAACAATACTAGAAATGGGATGACAGGAGAACTAAAAAACTGCTCTTTCAATATCACCACAAAAATAACAAATAAGGTACAGAAAGAATATGCACTCTTTTATAAACTTGATGTAGTACCAATAAATAATAAGGATAATGATACTAGCTTTAATAATAATAGCTATAGGTTGATAAGTTGTAACACCTCAGTTATTACACAGGCTTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTACTGTACCCCGGCTGGTTATGCAATTCTAAGGTGTAACAATGAGACATTCAGTGGAAAAGGGCCATGTACAAATGTCAGCTCAATACAATGTACACATGGAATTAGGCCAGTAGTGTCAACTCAACTGCTGTTAAATGGCAGTCTAGCAAAACAGGAGGTAGTAATTAGATCTCAAAATTTCTCGGACAATGTTAAAACCATAATAGTACAGCTGAAGACCCCTGTAAAAATTAACTGTACAAGGCCCAATAACAATACAAGAAAAAGTATACATGCAGGACCAGGGAAAGTAATTTATGCAACAGGAGAAATAATAGGAGATATAAGACAAGCACATTGCAACATTAGTGCAGCAGAGTGGAATGATACTTTAGGACAGATAGTTACAAAATTACAAGAACAATTTGGGAATAAAACAATAGTCTTCAATCAATCGTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTTTACTGTAATTCAACACAACTGTTTAATAGTACTTGGAATAATAATGGTACTAATACTTGGAATAGTACAGGTAATATCACACTCCCATGTAAAATAAGGCAAATTGTAAACATGTGGCAGAAAGTAGGAAAAGCAATGTATGCTCCTCCCATCCGTGGACAAATTAAATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAACGAGAGTGAGAGCGAAACCTTCAGACCTGGCGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGACTAGCACCCACTAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAACACTGGGAGCTGTGTTCCTTGGGTTCTTGGGAACAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGGCAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATCTGCTGAAGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATTAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGCAATAAATCTCTGAATGAAATTTGGGATAACATGACCTGGATGGAGTGGGAAAAAGAAATTAGTAATTACACACAATTAATATACACTTTAATTGAAGAATCGCAGAGCCAGCAAGAAAAGAATGAACAAGAATTATTGGCACTAGATAAGTGGGACAGCTTGTGGAGTTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAATAGGGTTAAGAATAGTTTTTACTGTACTTTCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTGTCATTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGACGGTGGAGAGAGAGACAGAGACAGATCCACACGCTTAGTAACCGGATTCTTACCACTTTTCTGGGACGACCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTACAATATTGGAGTCAGGAACTAAAAAAAAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTAGTACAAAGAGCTTGTAGAGCTATTCTCCACATACCTGTAAGACTAAGACAAGGCTTAGAAAGAGCTTTGCTATAA +MK116110.1,tat_exon2,7654,7750,7705,7798,forward,0.5,RPASQPRGDPTGPKESKKTVERETETDPHA,RPASQPRGDPTGPKESKKTVERETETDPHA**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGACGGTGGAGAGAGAGACAGAGACAGATCCACACGCTTAGTAA +MK116110.1,rev_exon2,7655,7940,7706,7982,forward,0.48241758241758226,DPLPSPEGTRQARRNRRRRWRERQRQIHTLSNRILTTFLGRPEEPVPLQLPPLERLTLDCSEDCGTSGTQGVGNPQTLVESPTILESGTKKKCC,DPLPSPEGTRQARRNRRRRWRERQRQIHTLSNRILTTFLGRPEEPVPLQLPPLERLTLDCSEDCGTSGTQGVGNPQTLVESPTILESGTKKKCC*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGACGGTGGAGAGAGAGACAGAGACAGATCCACACGCTTAGTAACCGGATTCTTACCACTTTTCTGGGACGACCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTACAATATTGGAGTCAGGAACTAAAAAAAAGTGCTGTTAG +MK116110.1,nef,8074,8695,8125,8752,forward,0.4668269230769231,MGGKWSKSSVVGWPAVRERIRRAGPAAEGVGAVSRDLDKHGAITSNNTPATNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGMIYSQQRQDILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPLETEQVEAATGGENNCLLHPLNQHGMDDPEREVLMWKFDSSLAFHHRAKELHPEYYKDC,MGGKWSKSSVVGWPAVRERIRRAGPAAEGVGAVSRDLDKHGAITSNNTPATNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGMIYSQQRQDILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPLETEQVEAATGGENNCLLHPLNQHGMDDPEREVLMWKFDSSLAFHHRAKELHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGGTTGGATGGCCTGCTGTAAGGGAAAGAATAAGAAGAGCTGGGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGACAAACATGGAGCAATCACAAGTAACAATACACCAGCTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTTAGGCCTCAAGTACCTTTAAGACCAATGACTTACAAGGGAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGATGATATACTCCCAGCAAAGACAAGATATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGACCAGGGGTCAGGTTTCCACTGACCTTTGGATGGTGCTTCAAACTAGTACCACTTGAGACAGAGCAGGTAGAAGCGGCCACTGGAGGAGAGAACAACTGCTTGTTACACCCTTTGAACCAGCATGGGATGGATGACCCGGAGAGAGAAGTACTAATGTGGAAGTTTGACAGCAGCCTAGCATTTCATCACAGAGCCAAAGAGCTGCATCCGGAGTACTACAAAGACTGCTGA +MK115527.1,gag,683,2189,789,2292,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115527.1,pol,1975,4987,2084,5096,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115527.1,vif,4931,5510,5040,5619,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115527.1,vpr,5449,5743,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115527.1,tat_exon1,5720,5939,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115527.1,rev_exon1,5859,5937,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115527.1,vpu,5951,6197,6061,6310,forward,0.6865853658536587,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115527.1,env,6114,8655,6224,8795,forward,0.49135514018691584,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115527.1,tat_exon2,8236,8332,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115527.1,rev_exon2,8237,8522,8377,8653,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115527.1,nef,8656,9277,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK114997.1,gag,210,1725,789,2292,forward,0.22980000000000023,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP*YQ*E*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATGGGAAAAAATTTACCTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGCGTACATCAAAGGATAAATGTAAAAGACACCAAGGAAGCTCTAGACACAATAGAGGAAGAACAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATGGTACATCAACCCATATCACCTAGCACTTTAAATGCATGGGTAAAAGTGATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAGGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAGGGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATACTCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGGGATTATGTAGATCGGTTCTATAAAACTCTAAGGGCTGAGCAAGCGTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCCTCCATAATGGCGCAAGGAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAGAATAG +MK114997.1,pol,1511,4601,2084,5096,forward,0.21934197407776668,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*NMEQFSKTPYAYFKESSEMGLQTSL*,TTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAGAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCAGTCAACATAATTGGAAGAAATCTGTTGACCCAGCTTGGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGACAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATGGAAAAGGAAGGGAAAATTACAAAAATTGGGCCTGAGAATCCATATAATACTCCAGTGTTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTGGGAAGTTCAACTAGGAATACCACATCCCGCAGGGTTAAAAAGGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTTTCAGTTCCTTTAGACCAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGGAGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGGGGTGGGGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAGTTGAATTGGGCAAGCCAGATCTATCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTCCATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGGGGAGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCTATACAAAAGGAAACATGGGAAATGTGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAATTAGGAAAAGCAGGGTATGTTACGGACAGAGGAAGACAAAAGGTTGTCTCCCTAATGGACACAACAAATCAGAGGACTGAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTAACAGACTCACAATATGCCTTAGGGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAGGAAAAGATTTACCTGGCATGGGTCCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTAATGGAATCAGAAAAATACTATTTCTGGATGGAATAGATAAGGCCCAAGAAGAACATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATACATAGAAGCAGAAGTTATTGCCGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGA +MK114997.1,vif,4467,5046,5040,5619,forward,0.38020833333333326,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGGGGAAGCAAGATTGGTAATAAAAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTAGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCCTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAG +MK114997.1,vpr,4985,5279,5558,5850,forward,0.44230769230769296,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*L,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGCTT +MK114997.1,tat_exon1,5256,5472,5830,6045,forward,0.5694444444444444,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAG +MK114997.1,rev_exon1,5395,5473,5969,6045,forward,0.6538461538461537,MAGRSGDSDEELLTAVRIIKRLYQSS,MAGRSGDSDEELLTAVRIIKRLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT +MK114997.1,vpu,5487,5733,6061,6310,forward,0.751219512195122,MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM,MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM*,ATGCATGCCTTAAAAATAGCAGCAATAGTAGGATTAGTAGTAGCAACAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGAGACCAGGAGGAATTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG +MK114997.1,env,5762,8216,6224,8795,forward,1.2265186915887858,MHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MGYLYGKKQLPLYFVHQMLKHMRQRSIMFGQPMPVYPQTPAHRK*H*KM*QKHLTCGKMTW*SRCMRI*SVYGIKA*SHV*N*PHSVLL*IALIV*VIILIII*RKKEK*KTALSMSPQE*EIG*QKNMHFSIDLM*YQ*MKIVEILRANIG**IVTPQSLHKPVQRYPLSQFPYIFVPRLVLRF*SVEIRNSMEQENVEMSAQYNVHMELGQ*YQLNCC*TAV*QKKR**LDLPISRTMLKP**YS*INL*KLIVQDPTIIQEEVYT*DQGEHFMEQT**GI*DKRIVTLVGKIGMTL*KKIVIKLKEKFENKTIVFNQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*DG*,ATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGAAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAGTTTAAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAGACTTGATGTAGTATCAATAGATGAAGATAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGATATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAGAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAACCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGAGCATTTTATGGAACAGACATAATAGGGGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAAAAAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATGGTACTGATAATTGGAATGGTACTGAATCAAATAACACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCTCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGGAGCAACAATAGTAGTAATGATACAGAGACATTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAGTGGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAGGCAGTGGGAAAAGGAAATTGACAATTACACAGACACAATATATAACTTAATTGAACTATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAGTTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTACTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAAGATGGGTAA +MK114997.1,tat_exon2,7788,7881,8376,8469,forward,0.4866666666666659,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG +MK114997.1,rev_exon2,7789,8065,8377,8653,forward,0.4285714285714286,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG +MK114997.1,nef,8208,8856,8796,9417,forward,0.7959349593495859,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC*H*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTGCCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTTCAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTTCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGTCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAATATTTCAAGGACTGCTGACACTGA +MK115518.1,gag,739,2245,789,2292,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115518.1,pol,2031,5043,2084,5096,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115518.1,vif,4987,5566,5040,5619,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115518.1,vpr,5505,5799,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115518.1,tat_exon1,5776,5995,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115518.1,rev_exon1,5915,5996,5969,6045,forward,0.6346153846153846,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115518.1,vpu,6007,6253,6061,6310,forward,0.6865853658536587,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115518.1,env,6170,8711,6224,8795,forward,0.49018691588785046,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115518.1,tat_exon2,8292,8388,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115518.1,rev_exon2,8293,8578,8377,8653,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115518.1,nef,8712,9333,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK115065.1,gag,221,1736,789,2292,forward,0.24380000000000024,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*K*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATGGGAAAAAATTTACCTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGCGTACATCCAAGGATAAATGTAAAAGACACCAAAGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATGGTACATCAACCCTTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGCTGAGGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAGGGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGATATCTATAAAAGATGGATAATCCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGGGATTATGTAGACCGGTTCTATAAAACTCTAAGGGCTGAGCAAGCGTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAATCAGCCTCCATAATGGTGCAGGGAGGCAATTTTAGGAACCAAAGAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACACAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAG +MK115065.1,pol,1522,4534,2084,5096,forward,0.20438683948155534,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCAGTCAACATAATTGGAAGAAATCTGTTGACCCAGCTTGGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATGGAAAAGGAAGGGAAAATTACAAAAATTGGGCCTGAGAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTGGGAAGTTCAACTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGGAGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGATTTAGAAATAGAGCAGCACAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGGGGTGGGGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTGGACTATCAATGACATACAGAAGTTAGTGGGAAAGTTGAATTGGGCAAGCCAAATCTATCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGGGGAGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCTATACAAAAGGAAACATGGGAAATGTGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAATTAGGAAAAGCAGGGTATGTTACGGACAGAGGAAGACAAAAGGTTGTCTCCCTAATGGACACAACAAATCAGAGGACTGAGTTACACGCTATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAGGGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAGGAAAAGATTTACCTGGCATGGGTCCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTAGTGGAATCAGAAAAGTACTATTTCTGGATGGAATAGATAAGGCCCAAGAAGAACATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115065.1,vif,4478,5057,5040,5619,forward,0.38020833333333326,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGGGGAAGCAAGATTGGTAATAAAAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAG +MK115065.1,vpr,4996,5290,5558,5850,forward,0.4807692307692313,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*L,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAACTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGCTT +MK115065.1,tat_exon1,5267,5486,5830,6045,forward,0.5972222222222223,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA +MK115065.1,rev_exon1,5406,5484,5969,6045,forward,0.6538461538461537,MAGRSGDSDEELLTAVRIIKRLYQSS,MAGRSGDSDEELLTAVRIIKRLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT +MK115065.1,vpu,5498,5744,6061,6310,forward,0.751219512195122,MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM,MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM*,ATGCATGCCTTAGAAATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGGGACCAGGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG +MK115065.1,env,5661,8262,6224,8795,forward,0.5663551401869167,MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGAAAGTGACGGGGACCAGGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAACAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAAATCGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAGGTAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATGGAACAGACATAATAGGAGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAATAGTACTTGGAATGGTACTGACAATTGGAATGGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGGAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAATAGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAAGCAGTGGGAAAAGGAAATTGACAATTACACAGACATAATATATAACCTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +MK115065.1,tat_exon2,7843,7936,8376,8469,forward,0.4866666666666659,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG +MK115065.1,rev_exon2,7844,8120,8377,8653,forward,0.4285714285714286,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG +MK115065.1,nef,8263,8911,8796,9417,forward,0.7471544715447078,MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*H*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTACCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAGAACCTGCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGACACTGA +MK115464.1,gag,527,2297,789,2292,forward,1.495,MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ,MLQAIPGLRVGPAGSHPFALTSLSASCCHQSQSPGCSGATARTGT*KRK*NQRSSLDAGLGLLKRARQEARGGDW*VRQF*LAEARRREISARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADKGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNA*VKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAE*DRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIA*MTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKN*MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ*,ATGCTTCAGGCCATCCCTGGTTTGAGGGTGGGTCCCGCCGGGTCCCACCCCTTTGCACTCACGAGCCTGTCTGCCTCCTGCTGCCATCAATCACAGAGCCCAGGCTGTTCGGGCGCCACTGCCCGAACAGGGACCTGAAAGCGAAAGTAGAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGAGGCGGCGACTGGTGAGTACGCCAATTTTGACTAGCAGAGGCTAGAAGGAGAGAGATAAGTGCGAGAGCGTCTGTATTAAGCGGGGGAGAATTAGATAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAGAAAAGATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCCGGCCTTTTAGAAACAACAGAAGGATGTAAACAAATACTGGAACAGCTGCAACCATCCCTTCCGACAGGATCAGAAGAACTTAGATCATTATTTAATACAGTAGCAACCCTCTATTGTGTGCATAAGAGAATAGAGGTACAAGACACCAAGGAAGCCTTAGAAAAGATAGAAGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAGGCAGTAGCTGACAAAGGAAGTACCAGCCAGGTCAGCCAAAATTACCCGATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGGCCATATCGCCTAGAACTTTAAATGCATAGGTGAAAGTAGTAGAAGAGAAGGCCTTTAGCCCAGAGGTAATACCCATGTTTTCAGCATTATCGGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAGGCTGCAGAATAAGATAGAGTGCATCCAGTGCATGCAGGGCCTGTTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATAGATGACAAGTAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTAGGATTAAATAAGATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAGTCCTAAGAGCCGAGCAAGCATCACAGGATGTAAAAAATTAGATGACAGAAACCTTATTAGTCCAAAATGCAAACCCAGATTGTAAGACTATTTTAAAAGCATTAAGACCAGCAGCAACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAAATATCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGACTGTTAAGTGTTTCAATTGTGGCAAAGAAAGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAAGGAAGATCTGGCCTTCCTCCAAAGGAAGGCCAAGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTAGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAAGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MK115464.1,pol,2089,5101,2084,5096,forward,1.8783649052841465,AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED,FFKEDLAFLQRKAKELSSEQTRANSPTRRELQV*GGDSNSSSEAGAGGQRSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEISLPGR*KPKMIEGIGGFIKVRQYDQITIEICGHKAIGTVLVGPTPVNIIGRNLLTQISCTLNFPISPIETVPVQLKPGIDSPKVKQWPLTEEKIKALVEICTEMEKEKKISKIRPENPYNTPVFAIKKKDSTK*RKLVDFKELNKRTQDF*EVQLRIPHPARLKKKKSITVLDVGDAYFSIPLDKDFKKYTAFTIPSINNKTPEIRYQYNVLPQG*KRSPAIFQSSMIKILEPFRKQNPDIVIYQYIDDLYVRSDLEIRQHRTKIEELRQHLLK*RLTTPDKKHQKEPPFLWISYELHPDKWTVQPIVLPDKDSWTVNDIQKLVRKLN*ASQIYAEIKVRQLCKLLKGAKALTEVIQLTEEAELELAENKEILKEPVHEVYYDPSKDLIAELQKQRQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVI*GKTPRFKLPIQKET*DT*WTEYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVGAETFYVDRAANKETKLRKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALRIIQAQPDKSESEIVNQIIEQLIKKEKVYLA*VPAHKRIRRNEQVDKLVSARIRKVLFLDRIDKAQEEHKKYHNN*RAMASDFNLPPVVAKKIVASCDKCQLKKEATHRQVDCSPRIWQLDCTHLEGKVILVAVHVASRYIEAEVIPAETGQETAYFLLKLAGR*PVKAIHTDNGTNFTSATVKAAC**AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED*,TTTTTTAAGGAAGATCTGGCCTTCCTCCAAAGGAAGGCCAAGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTAGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAAGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGAGGGCAGCTAAAGGAAGCTCTATTAGATACAGGAGCAGATGACACAGTATTAGAAGAAATAAGTTTGCCAGGAAGATAGAAACCAAAAATGATAGAAGGAATTGGAGGCTTTATCAAAGTAAGACAGTATGATCAGATAACTATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGCAGAAATTTGTTGACTCAGATTAGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTACAATTAAAACCAGGAATAGATAGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAAGAAAAAAAGATTTCAAAAATTAGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGAAGAAAATTAGTAGATTTCAAGGAACTTAATAAAAGAACTCAAGACTTCTAAGAAGTTCAATTAAGAATACCACACCCCGCAAGGTTAAAAAAGAAGAAATCAATAACAGTACTAGATGTAGGTGATGCATATTTTTCAATTCCCTTAGATAAAGACTTCAAGAAGTATACTGCATTTACCATACCTAGTATAAATAATAAGACACCAGAGATTAGATATCAGTACAATGTGCTTCCACAGGGATAGAAAAGATCACCAGCAATATTCCAAAGTAGCATGATAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGACATAGTTATCTATCAATACATAGATGACTTGTATGTAAGATCTGACTTAGAAATAAGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACACTTGTTGAAGTAGAGATTGACCACACCAGATAAAAAACATCAGAAAGAACCCCCATTCCTGTGGATAAGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGACAAAGATAGCTGGACTGTCAATGACATACAGAAGCTAGTAAGAAAATTGAATTGAGCAAGTCAGATTTATGCAGAGATTAAAGTGAGACAATTATGTAAACTCCTTAAAGGAGCCAAAGCGCTAACAGAAGTGATACAACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAAAGAAATTCTAAAAGAACCAGTACATGAAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAGTTACAGAAGCAGAGGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAACGAGAGGTACCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTGATATGAGGAAAGACCCCTAGATTTAAACTACCCATACAGAAAGAAACATAAGATACCTAGTGGACAGAATATTGGCAAGCCACCTAGATTCCCGAGTAAGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATAGTACCAATTAGAAAAAGAGCCTATTGTAGGAGCAGAAACTTTCTATGTAGATAGGGCAGCTAATAAAGAGACTAAATTAAGAAAAGCAGGATATGTTACTAGCAGAGGAAGACAAAAGGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAACTGCAAGCAATTTGTCTAGCATTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCACTAAGAATAATTCAAGCACAACCAGATAAGAGTGAATCAGAGATAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTACCTTGCATAGGTACCAGCACACAAAAGAATTAGAAGAAATGAACAAGTAGATAAATTAGTCAGTGCTAGAATCAGGAAAGTCCTATTTTTAGATAGAATAGATAAGGCCCAAGAAGAGCATAAGAAATATCACAATAATTAAAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAAAAATAGTAGCCAGTTGTGATAAATGCCAGCTAAAAAAAGAAGCCACGCATAGACAAGTAGACTGTAGTCCAAGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAGTTATCCTAGTAGCAGTTCATGTAGCCAGTAGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTCCTCTTAAAATTAGCAGGAAGGTAGCCAGTGAAAGCAATACATACAGACAATGGAACCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTAGTAGGCAAAGATCAAGCAGGAATGTGGCATTCCCTACAATCCCCAAAGTCAAGAAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAAGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTCCAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAACAGAGATCCACTTTGGAAAGGACCAGCAAAACTTCTTTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAAGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115464.1,vif,5045,5624,5040,5619,forward,1.494270833333335,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY*GLHTGERDWHLGQGVSIEWKERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRRSQTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGCACATGGAAAAGTTTAGTAAAACACCATATGTACATTTCAAAGAAAGCCCAAGGATGGTTTTATAGACATCACTATGAAAATCCTCATCCAAGAATAAGTTCAGAAGTACACATCCCGCTAGGGGATGCTAGATTGGTAATAACAACATATTAGGGTCTGCATACAGGAGAAAGAGACTGGCATTTAGGTCAAGGAGTCTCCATAGAATGGAAGGAAAGGAAATATAGCACACAAGTAACCCCTGACCTAGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTGCAGAATCTGCTATAAGAGAGGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAACAGCATTAGTAACACCAAAAAAGACAAAGCCACCTTTGCCTAGTGTGACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAG +MK115464.1,vpr,5563,5857,5558,5850,forward,0.5192307692307698,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS*I,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTAGGACAACATATCTATGAAACTTATGAGGATACTTGGACAGGAGTAGGAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTAGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGATT +MK115464.1,tat_exon1,5711,6053,5830,6045,forward,2.118055555555556,MRILGQE,MRILGQE*EP**EFCNNCCLFISELGANIAE*ASLDRGEQEIEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ*,ATGAGGATACTTGGACAGGAGTAGGAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTAGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAAATGCTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGA +MK115464.1,rev_exon1,5973,6051,5969,6045,forward,0.5769230769230769,MAGRSGDSDEDLLKTVRLIKYLYQSS,MAGRSGDSDEDLLKTVRLIKYLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGT +MK115464.1,vpu,6065,6347,6061,6310,forward,1.3170731707317076,AIVLIEYKKILKQRRIDRLIDRIIDKAEDSGNESEGDQEELSAFVEIGHHAP,MQSLYILTIVALVVAAILAIVV*AIVLIEYKKILKQRRIDRLIDRIIDKAEDSGNESEGDQEELSAFVEIGHHAP*NVDDL*YCRPVVGHSLL*,ATGCAATCTTTATATATATTAACAATAGTAGCATTAGTAGTAGCAGCAATATTAGCAATAGTTGTGTAGGCCATAGTACTCATAGAATATAAGAAAATATTAAAACAAAGGAGAATAGATAGGTTAATTGATAGAATAATAGATAAGGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAGGGCATCATGCTCCTTAGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATAA +MK115464.1,env,6228,8826,6224,8795,forward,1.8288551401869095,MTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST,MRVKEIKRSYQHL*R*GIMLLRMLMIYSTADQWWVTVYYKVPVWREANTTLFCASDAKAYSTEAHNV*ATHACVPTDPNPQEIVIENVTEDFNMWKNNMVDQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTSNTT*GEMTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST*TKNGTDSWQSNDTQNSNITLQCRIKQIINLWQEVRKAMYAPPISRQINCTSNITGLVLTRDRRNETKTFRPGRENMKDNWRSKLYKYKVVRIEPLRIAPTKAKRRVVQREKRAVRLGAMFLKFLGAARSTIGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLAVERYLQDQQLLGL*GCSRKLICTTTVP*NRS*GRHNKNYKSLDDI*DNMT*IE*EKEIDNYTSLIYTLITESHSQQKKNEQELLALDK*ASL*N*FDISQWLWYIKIFIMIVGGLVSLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPERIEERGRERDKGRSGRLVNGFLALI*DDLRSLCLFSYHRLSDLLLIVIKIVELLRRKR*EALKY**NLLQY*SQELKNSAVSLLNTTAIVVAERTDKIIEILQRISRAFLHIPRRIRQGLEKALL*DRWQVVKK*,ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAGGGCATCATGCTCCTTAGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATAAGGTACCTGTGTGGAGAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGCACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTAATAGAAAATGTAACAGAAGATTTTAACATGTGGAAGAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATAGGATCAAAGTCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGTACTGATATTAGGAATAGTACCGTTACTTCTAATACTACTTCTAATACTACTTAGGGAGAAATGACAAACTGCACTTTCAATATCACCACAAGCATAAAGGATAAGATAAAAAAAGAAGCGGCACTTTTTTATAAAATTGATTTAGTAGAAATAGATGAAAAGAAAAATAACAGTAGTACCAGATATAGGTTGATAAATTGTAACACCTCAGCCATTACACAAGCCTGCCCAAAGGTATCCTTTAAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCAATTCTAAAGTGTAATAATAAGAAGTTCAGTGGAAAAGGACCATGTACAAATGTCAGCACAGTGCAATGTACACATAGAATTAAGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAATGATTAGATCTGACAATATCACAGACAATACTAAAAACATAATAGTACAGTTGAAAGAAGCCATACGAATTTTCTGTATAAGACCCAACAACAATACAAGAAAAAGTATAAATATAAGACCAGGAAGAGCATTTTATACAACAGGAGATATAATAAGAGACATAAGGCAAGCACATTGTAACATTAGTGGAAATTGGAGTAACACTTTAAAACAGATAGCTACACAATTAGGAAAACAACTGAATCAAACACAACAAATAATCTTTAATTCATCCGCAGGAAAGGACCCAGAGATTGTAACACACAGTTTTAATTGTGGAAAGAAATTCTTCTATTGTAATTCATCATCACTGTTTAATAGTACCTAGACTAAAAATGGTACTGATAGTTGGCAGTCTAATGATACTCAGAATAGTAATATCACACTCCAATGCAGAATAAAACAAATTATAAACCTGTGGCAGGAAGTAAGAAAAGCAATGTATGCCCCTCCCATCAGTAGACAAATTAACTGTACATCAAATATTACAGGGCTAGTTTTAACAAGAGATAGGAGGAATGAAACTAAGACCTTTAGACCTGGAAGAGAAAATATGAAGGATAATTGGAGAAGTAAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAAGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAGAGAGAGAAAAGAGCAGTAAGACTAGGAGCTATGTTCCTTAAGTTCTTAGGAGCAGCCAGAAGCACTATAGGCGCAGCGTCGATAGCGCTGACGGAACAGGCCAGACGAGTCTTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATTTGTTGCAACTCACAGTCTAAGGCATTAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTACAGGATCAACAGCTCCTAGGACTTTGAGGTTGCTCTAGAAAACTCATTTGCACCACTACTGTGCCTTAGAATCGTAGTTGAGGTAGGCATAACAAAAATTACAAAAGTCTAGATGACATTTAGGATAACATGACCTAGATAGAGTAGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTACAGAATCACATTCCCAACAAAAAAAGAATGAACAAGAATTATTGGCATTAGATAAATAGGCAAGTTTGTAGAATTAGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAAGGACAGATAAGATAATAGAAATATTACAAAGAATTAGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAAGATAGGTGGCAAGTGGTCAAAAAGTAG +MK115464.1,tat_exon2,8380,8476,8376,8469,forward,0.6000000000000001,RPSSQPREEPTGPKE,RPSSQPREEPTGPKE*KKEVERETKADPVD**,AGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGA +MK115464.1,rev_exon2,8381,8657,8377,8653,forward,0.8274725274725274,RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE,DPPPSPERSRQARKNRRKR*RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE*,GACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAG +MK115464.1,nef,9064,9496,8796,9417,forward,1.64878048780488,MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC,MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*HRAFHQGLSRRGVA*,ATGACTTATAAAGCAGCTCTAGATCTGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAGTTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTATTTCCCTGATTGGCAGAACTACACACCAGGGCCAAGGATCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCACTTGAGCCAGATCAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCCTGTTACACCCTCTGAGCCAGCATAGGATGGATGACCCGGAGAAAGAAGTGCTAGTGTGGAGATTTGACAGCCGCCTCGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAAGACTGCTGACATAGAGCTTTCCACCAGGGACTTTCCAGAAGAGGCGTGGCCTAG +MK115530.1,gag,746,2252,789,2292,forward,0.2571999999999999,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115530.1,pol,2038,5050,2084,5096,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115530.1,vif,4994,5573,5040,5619,forward,0.36979166666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115530.1,vpr,5512,5806,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115530.1,tat_exon1,5783,6002,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115530.1,rev_exon1,5922,6000,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115530.1,vpu,6014,6260,6061,6310,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115530.1,env,6177,8718,6224,8795,forward,0.4941588785046729,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115530.1,tat_exon2,8299,8395,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115530.1,rev_exon2,8300,8585,8377,8653,forward,0.4285714285714286,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115530.1,nef,8719,9340,8796,9417,forward,0.5918699186991796,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK115520.1,gag,695,2195,789,2292,forward,0.2571999999999999,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115520.1,pol,1987,4915,2084,5096,forward,1.3952143569292395,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDMGNGQYSL,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDMGNGQYSL*YCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QR*YH*QKKQS*NWQKTGKF*ENQYMECIMTHQKT**QKYRSRAMDSGHIKFIKSHLKI*KQENMQE*GVPTLMM*NN*QRQYKR*PQKA**YGEKLLNLDYLYKKKHGRHGGQSTGKPPGFLSGSLSIPLP**NYGTN*RKNP**EQKLSM*MGQLIEKLN*AKQDMSLTEEDKRLSP*RTQQIKRLSYKQFI*LCRIRDQK*T**QTHNIH*ESFKHNQIRVNQS*SIR**SS**KRKKSTWHGYQHTKELEEMNK*TN*SVLESGEYYF*ME*IRPKKTMRNITVIGEQWLVILIYPL**QKK**PAVINVSKKERPCMDK*IVVQEYGN*IVHI*KGKLSW*QFM*PVDI*KQKLFQQRQGRKQHTFS*N*QGDGQ*KQYIQTMAAISPVMWLRPPVGGQGSSRNLAFPTIPKVKE**NP*IKN*RKL*DR*EIRLNILRQQYKWQYSSTILKEKGGLGGIVQGKE**I**QQTYKLKNYRNKLQKFKIFGFITGTAEIHFGKDQQSFSGKVKGQ**YKIIVI*K*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAAATAGGGGGGCAATTTAAAGAAGCTTTCTTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTAAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATATGGGAAATGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAG +MK115520.1,vif,4948,5527,5040,5619,forward,0.36979166666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115520.1,vpr,5466,5760,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115520.1,tat_exon1,5737,5956,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115520.1,rev_exon1,5876,5957,5969,6045,forward,0.6346153846153846,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115520.1,vpu,5968,6214,6061,6310,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115520.1,env,6131,8672,6224,8795,forward,0.49065420560747675,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAGATAAGATGCAGAAAGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAAATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGGATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTTAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115520.1,tat_exon2,8253,8349,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115520.1,rev_exon2,8254,8539,8377,8653,forward,0.4285714285714286,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115520.1,nef,8673,9294,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAATGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGATACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTGCACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK115503.1,gag,817,2323,789,2292,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115503.1,pol,2109,5121,2084,5096,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115503.1,vif,5065,5644,5040,5619,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115503.1,vpr,5583,5877,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115503.1,tat_exon1,5854,6073,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115503.1,rev_exon1,5993,6074,5969,6045,forward,0.6346153846153846,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115503.1,vpu,6085,6331,6061,6310,forward,0.6865853658536587,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115503.1,env,6248,8789,6224,8795,forward,0.49135514018691584,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115503.1,tat_exon2,8370,8466,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115503.1,rev_exon2,8371,8656,8377,8653,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115503.1,nef,8790,9411,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK115570.1,gag,687,2193,789,2292,forward,0.25119999999999987,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCGACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115570.1,pol,1979,4991,2084,5096,forward,0.14456630109670976,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115570.1,vif,4935,5514,5040,5619,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115570.1,vpr,5453,5747,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115570.1,tat_exon1,5724,5940,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG +MK115570.1,rev_exon1,5863,5941,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115570.1,vpu,5955,6201,6061,6310,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115570.1,env,6118,8659,6224,8795,forward,0.49649532710280364,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCTCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAAGGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115570.1,tat_exon2,8240,8336,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115570.1,rev_exon2,8241,8526,8377,8653,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115570.1,nef,8660,9281,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK115509.1,gag,555,2061,789,2292,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115509.1,pol,1847,4859,2084,5096,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115509.1,vif,4803,5382,5040,5619,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115509.1,vpr,5321,5615,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115509.1,tat_exon1,5592,5808,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG +MK115509.1,rev_exon1,5731,5809,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115509.1,vpu,5823,6069,6061,6310,forward,0.6865853658536587,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115509.1,env,5986,8527,6224,8795,forward,0.49135514018691584,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115509.1,tat_exon2,8108,8204,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115509.1,rev_exon2,8109,8394,8377,8653,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115509.1,nef,8528,9149,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK115702.1,gag,246,1782,789,2292,forward,0.2866000000000015,MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ,MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ*SQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGCGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAGGAAACGATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGCTTCGCAGTCAACCCTGGCCTGTTAGAAACATCAGAAGGCTGCAAACAAATAATGGGACAACTCCAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGTGTACATCAGAGGATAGATGTAAAGGATACCAAAGAAGCTTTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGACACAGCAAGCAGCAGCCGCTGACACAGGAAACAACAGCCAAGTCAGCCAAAATTACCCCATAGTGCAGAACATGCAGGGACAAATGGTACATCAGGCCATATCACCCAGAACCCTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCATTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAGGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAGGCTGCAGAATGGGATAGAGTGCATCCAGTGCAGGCAGGACCTGTTGCACCAGGCCAGATAAGGGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACACATAATCCACCCGTCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGACTAAATAAAATAGTAAGGATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAGACTCTAAGAGCTGAGCAAGCTTCACAGGAAGTAAAAGGTTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACCATTTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCAGCCATAAGGCAAGGGTTTTGGCAGAAGCAATGAGCCAAGCAACAGGTGCACATGCCATAATGATGCAGAGAGGCAATTTTAAGAACCAAAGAAAGACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGACTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCCTCAGGCCAACAGCCCCACCAGTAGAGAGCTTCAGGTTTGGGGAAGAGACAGCAGCCCCCTTTCAGAAGCAGGAACCGAGAGACAAGGAGATGTCTCCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCAGTAGTCACAATAA +MK115702.1,pol,1544,4586,2084,5096,forward,0.18175473579262214,FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCCTCAGGCCAACAGCCCCACCAGTAGAGAGCTTCAGGTTTGGGGAAGAGACAGCAGCCCCCTTTCAGAAGCAGGAACCGAGAGACAAGGAGATGTCTCCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCAGTAGTCACAATAAAGATAGGGGGGCAAATAAAGGAAGCTCTATTAGACACAGGAGCAGATGATACAGTATTAGAAGAAATGGCGTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATAGCCATAGAAATTTGTGGACATAAAGCAATTGGTACAGTATTAGTAGGACCTACACCTGTCAATATAATTGGAAGAAATCTATTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAGTTAAAGCCAGGAATGGATGGCCCAAAAATTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATAGGGCCTGAAAATCCATACAATACTCCAATATTTGCCATAAAGAAAAAAGACAGTACTAAGTGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGATTAAAAAAGAAAAAATCAATAACAGTACTGGATGTGGGTGATGCCTATTTTTCAGTTCCCTTAGATGAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGCATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATATTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGACGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTAAGAGGACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAGGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAGATGGACAGTACAGCCTATAAAGCTGCCAGAGAAAGAAATCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAACTGGGCAAGTCAGATTTACCCAGGAATTAAAGTAAAACAATTATGTAAACTCCTTAGGGGAACCAAAGCATTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGAATTAATAGCAGAAATACAGAAGCAAGGGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCGAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAGAAAATATCTACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAGGAAACATGGGAAATATGGTGGACAGACTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTTAGTACTCCTCCCCTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCATCTAATAGGGAGACTAAATTAGGAAAAGCAGGATATATTACTGACAGAGGAAGACAAAAGGTTGTCACCCTAAATGACACAACCAATCAAAAGACAGAGTTACAAGCAATTCTTCTAGCATTGCAGGATTCAGGATTAGAAGCAAACATAGTGACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGATCTACCTGACATGGGTACCAGCACATAAAGGAATTGGAGGAAATGAGCAAGTAGATAAATTAGTCAGTACTGGGATTAGGAAAGTATTATTTTTAGATGGAATAGATAGGGCCCAAGAAGAGCATGAGAGATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTCAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGACAAATAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACACTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTACCACAGTTAAGGCCGCCTGTTGGTGGGCGGGGGTCAAGCAGGAATTTGGTATTCCCTACAATCCCCAGAGTCAAGGAGTGGTAGAATCTATGAATAAAGAATTAAAGAAAATAATAGGACAGGTCAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTTCAAAAATTCAAAACTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCGGTAGTAATACAGGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115702.1,vif,4530,5109,5040,5619,forward,0.34375,MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGTATGTTTCAAAGAAAACTAAGGGATGGTTTTATAGACATCACTATGAGAGCACTCATCCAAAAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTGAGTTGGTAGTAACAACATATTGGGGTTTGCAGCCAGGGGAAAGGGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAGGGAGATATAGAACACACGTGGACCCTAACCTAGCAGACCAACTAATTCATCTGCATTACTTTGATTGTTTTTCAGAATCTGCTATAAGACATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAAGAGCACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACTAAACTAACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG +MK115702.1,vpr,5048,5342,5558,5850,forward,0.44230769230769296,MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS,MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS*P,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAACTTAAGCAGGAAGCTGTTAGGCATTTTCCTAGGCCATGGCTTCATAGCTTAGGGCAATATATCTATGAAACTTATGGGGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATGCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATCCCACAGAGGAGAGCAAGAAATGGATCCAGTAGATCCTAACCT +MK115702.1,tat_exon1,5319,5535,5830,6045,forward,0.6319444444444446,MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ,MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ,ATGGATCCAGTAGATCCTAACCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTAACAATTGCTATTGTAAAAAGTGTTGCCTTCATTGCCAAGTTTGTTTCACACGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAG +MK115702.1,rev_exon1,5458,5536,5969,6045,forward,0.8076923076923077,MAGRSGDGDEDLLKAVRLIKTLYQSS,MAGRSGDGDEDLLKAVRLIKTLYQSS,ATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAGT +MK115702.1,vpu,5550,5808,6061,6310,forward,0.807317073170732,MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND,MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND**,ATGTTATCTTTAGAAGTAATAGTAGCAATAACAGCATTAGTAGTAGCAGGAATAATAGCAATAGTTGTGTGGACCATAGTACTTATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAAGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAGGGGGATCAGGAAGAATTGTCAGCGCTTGTGGAGATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAA +MK115702.1,env,5716,8257,6224,8795,forward,0.6026869158878512,MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE,MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE*DRA*,ATGAGAGTGAGGGGGATCAGGAAGAATTGTCAGCGCTTGTGGAGATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAATGCTACAGAACAATTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACAACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATGGTATTAATAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGATCAAATGCAAGAGGACATAGTCAGCTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACCTTAAATTGCACTAATTTGACCATTGAGCCAAACAATGCTACTAAAGCCAATATTAGTGGGAGGTTAGAGGGGAAAGGAGAAATGACAAACTGCTCTTTCAATGTCACCACAAGCCTAAGAGATAAGAGGAAGAAAGAATATGCACTCTTTTATAAACTTGATGTAGTAGCAACAGGTGAAAATAATAACAGCTTTAGGTTGATAAGTTGTAATACCTCAGAGATTACACAGGCCTGTCCAAAGGTATCATTTGAACCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATGATAAAAAGTTCAATGGAACAGGAAAATGTAACAATGTCAGCATAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAGTAGTTAGATCTGCCAATTTCTCAGACAATACTAAGACCATAATAGTACAGCTGAACAAAACTGTAGTAATTAATTGTACAAGACCCAACAACAATACAAGGAGAAGTATACATATAGCACCAGGGAGAGCATTTTATGCAACAGGAGATATAATAGGAGATATAAGAAAAGCACATTGTAACATTAGTAAAGAAGATTGGAATACCACTTTAAACCAGGTGGCTAAAAAATTACAAGAACAATTTGAGAATGCAACAATAGACTTTAAACCATCCTCAGGAGGGGACCCAGAAATTGTAATGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACGGAACTATTTTCTTGGAATGCTACAACAAAACTGTTTACTTGGAATGCTACAAATAGCAATAATGGAACCATCATACTCCCATGTAGAATAAAACAAATTATAAACATGTGGCAAGAGGTAGGAAAAGCAATGTATGCCCCTCCCATTCGTGGACAAATTAGATGTTCGTCAAATATTACAGGACTGCTATTAACAAGAGATGGTGGGACTAACGGGACAGGGAACAGGAATGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAGAAATTAAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGACCATAGGAGCTATGTTCCTTGGGTTCCTGGGGGCAGCAGGAAGCACTATGGGCGCAGCATCACTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCGATTGAGGCGCAGCAGCATCTGTTGCAACTCACAGTCTGGGGCATAAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGGTACCTAAGAGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAATATTAGTTGGAGTAATAGAACTCTGAATAACATTTGGGACAATTTGACTTGGATGCAGTGGGATACAGAAATTAACAATTACACAAACAAAATATACCAATTACTTGAGGAAGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAATTTGTGGAATTGGTTTGACATATCAAACTGGCTGTGGTACATAAAAATATTCATATTAATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGAACGGATTCTTGACACTTATCTGGGTCGATCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTCAAATATTGGTGGAATGTCCTGCAATATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTAAATGCCACAGCCATAGTAGTAGCTGAGGGGACAGATAGGATTATAGAATTAGCACAAAGAATTTGTAGAGCAGAATAAGACAGGGCTTGA +MK115702.1,tat_exon2,7874,7970,8376,8469,forward,0.6866666666666661,RPASQSRGDPTGPKEPKKKVERETETDPTD,RPASQSRGDPTGPKEPKKKVERETETDPTD**,AGACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGA +MK115702.1,rev_exon2,7875,8160,8377,8653,forward,0.3296703296703296,DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE*CC*,GACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGAACGGATTCTTGACACTTATCTGGGTCGATCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTCAAATATTGGTGGAATGTCCTGCAATATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAG +MK115702.1,nef,8275,8896,8796,9417,forward,0.658536585365846,MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC,MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC*,ATGGGTGGCAAGTGGTCAAAACATAGTAAGAGTGAATGGGCTGATGTAAGGGAAAGAATGGCACAAACTGAGGCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGATCTGGAAAGACATGGAGCAATCACAAGTAGCAATACAGCAACTAACAATGCTGCTTGTGCTTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCAAACCTCAGGTGCCTTTGAGACCAATGACCTACAAGGGAGCTTTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTATTCCCAAAAAAGACAAGACATCCTTGATCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGAACCAGATTCCCACTGTGCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTGGAAGAAGCCAATAAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACACCGAGAGAGAGGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACGTAGCCAGAGAGAAACATCCGGAGTACTTCAAGGACTGCTGA +MK115095.1,gag,2,1697,789,2292,forward,1.8384000000000005,MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC,SGFSFTFKSLFGRHLGDLKAKEKPEELSRRRTRLAERARQEARRGD**VRRNF*LAEARRREIGARASVLSGGELDR*EKIYLRPGRKKKYRLKHIVWASRELERFAVNPGLLKSSEGCRQILGQLQPALQTGSEELRSLYNTIAVLYCVHQKINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQIVHQPISPRTLNA*VKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVRRHQAAMQMLKETINDEAAE*DRLHPVHAGPIAPGQMKEPRRSDIAGTTSTLQEQIR*MTNNPPIPVGEIYKR*IILRLNKIVKMYSPVSILDIRQRPKEPFKDYVDRFYKTLKAEQASQDVKN*MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC*KCGKKGHQMKDCTKRQANFLRKIWPSHKGRPKNFLQSRPEPTAPPAESFRFKEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*,TCTGGTTTCTCTTTCACTTTCAAGTCCCTGTTCGGGCGCCATCTAGGGGACCTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCACGGCAAGAGGCGAGGCGCGGCGACTAGTGAGTACGCCGAAATTTTTGACTAGCAGAGGCTAGAAGGAGAGAGATAGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATAGGAAAAAATTTACCTAAGGCCAGGGAGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAAAGTCATCAGAAGGCTGCAGGCAAATTCTAGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAGATAAATGTAAAAGACACCAAAGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAAGGGCAAATAGTACATCAACCCATATCACCTAGAACTTTAAATGCATAGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGAGAAGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAAGCTGCAGAATAAGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAAGGAACCAAGAAGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAAGATAGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATAGATAATCCTGAGGTTAAATAAAATAGTAAAAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAAGACCAAAGGAACCCTTTAAGGATTATGTAGACCGGTTCTATAAAACTCTAAAGGCTGAACAAGCGTCACAGGATGTAAAAAATTAGATGACAGAAACCTTGTTAGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAAGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGAGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAGTCAGCCTCCATAATGGTGCAAGGAGGCAATTTAAAGAACCAAAGAAAGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACACAGCCAAAAATTGCAGGGCCCCTAAGAAAAAAGGCTGTTAGAAATGTGGAAAGAAAGGACACCAAATGAAAGATTGTACTAAGAGACAGGCTAATTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAAAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTAAGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA +MK115095.1,pol,1489,4579,2084,5096,forward,1.9898305084745753,KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK,FFKEDLAFPQGKAKEFSPEQTRANSPASRELQV*GRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIRRQLKEALLDTGADDTVLKEINLPGK*KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK*RKLVDFRELNKRTQDF*KVQLRIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPRVRYQYNVLPQR*KGSPAIFQSSMTKILEPFRKENPDIVIYQYIDDLYVRSDLEIEQHRTKIEELRQHLLK*RLTTPDKKHQKEPPFL*ISYELHPNKWTVQPIQLPDKDS*TVNDIQKLVRKLN*ASQIYPEIKVKQLCKLLRRTKALTEVVPLTEEAELELAENKEILKEPVHRAYYDPSKDLIAEVQKQGGDQWTYQIYQKPFKNLKTKKYARTRGAHTNDVKQLTEAVQKIALEAIVI*RKTPKFKLPIQKET*EM**TEYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVRAETFYVDRAANRETKLRKARYVTDRRRQKVVSLIDTTNQRTKLHAIHLALQDSGSTVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKEKIYLA*VPAHKRIRRNEQVDKLVSSRIRKVLFLDRIDKAQEEHEKYHSN*RAMASDFNLPPVVAKEIVASCDKCQLKREPMHGQVDCSPGIWQLDCTHLERKIILVAVHVASRYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAAC**ARIKQKFSIPYNPQSQGVVESMNNELKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKRGIGGYSAEERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLL*KGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*NMEQFSKTPYAYFKESSEMSLQTSP*,TTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAAAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTAAGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAAGAAGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAAAAGAAATAAATTTGCCAGGAAAATAGAAACCAAAAATAATAGAAGGAATTAGAGGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAAAAATTTGTAGACATAAAGCTATAAGTACAGTATTAATAAGACCTACACCAGTCAACATAATTAGAAGAAATCTGTTGACCCAGCTTAGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATAGATAGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATAGAAAAAGAAAGGAAAATTACAAAAATTAGGCCTAAGAATCCATATAATACTCCAGTGTTTGCCATAAAGAAAAAAGACAGTACTAAATAGAGAAAATTAGTAGATTTCCGAGAACTTAATAAAAGAACACAAGACTTTTAAAAAGTTCAACTAAGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTAGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAAGAGTTAGATATCAGTACAATGTGCTTCCACAAAGATAGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAAGAAAATCCAGACATAGTTATCTATCAATACATAGATGATTTGTATGTAAGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAAGAACTGAGACAACATCTGTTAAAGTAAAGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTAGATAAGTTATGAACTCCATCCTAATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTAGACTGTCAATGACATACAGAAGTTAGTAAGAAAGTTAAATTAGGCAAGCCAGATCTATCCAGAGATTAAAGTAAAGCAATTATGTAAACTCCTTAGAAGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAAGGAGATTCTAAAAGAACCAGTACATAGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGAGGAGACCAATGGACATATCAAATTTATCAGAAGCCATTTAAAAATCTGAAAACAAAGAAATATGCAAGAACGAGAGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATAGAGAAAGACTCCTAAATTTAAACTACCTATACAAAAAGAAACATAAGAAATGTAGTAGACAGAGTATTGGCAAGCCACCTAGATTCCTGAGTAGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATAGTACCAGTTAGAGAAAGAACCCATAGTAAGAGCAGAAACTTTCTATGTAGATAGGGCAGCTAATAGAGAGACTAAATTAAGAAAAGCAAGGTATGTTACGGACAGAAGAAGACAAAAAGTTGTCTCCCTAATAGACACAACAAATCAGAGGACTAAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAAAGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAAGAAAAAATTTACCTGGCATAAGTCCCAGCACACAAAAGAATTAGAAGAAATGAACAAGTAGATAAATTAGTCAGTAGTAGAATCAGAAAAGTACTATTTCTAGATAGAATAGATAAAGCCCAAGAAGAACATGAAAAATATCACAGTAATTAAAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAAGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAAGAAAAATTATCCTAGTAGCAGTTCATGTAGCCAGTAGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACAGTTAAGGCCGCCTGTTAGTAGGCAAGGATCAAGCAGAAATTTAGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAAAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAAGGGGGATTGGGGGGTACAGTGCAGAGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCAGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTAGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAAGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGAGTTTACAGACATCACCATGA +MK115095.1,vif,4445,5024,5040,5619,forward,1.8546875000000016,MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR,MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR*VYRHHHESHNPKTSSEVHIPLREARLVIKTY*GLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVRPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKRSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAAGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGAGTTTACAGACATCACCATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAAGGGAAGCAAGATTAGTAATAAAAACATATTAAGGTCTGCATACAGGAGAAAGAGACTGGCATTTAGGCCAGGGAGTATCCATAGAATGGAGGAAAAAGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGGCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATGAATGGACATTAG +MK115095.1,vpr,4963,5257,5558,5850,forward,0.5961538461538467,MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS,MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS*L,ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAACTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAAGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAACTT +MK115095.1,tat_exon1,5288,5453,5830,6045,forward,1.1236111111111113,MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ,MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ*,ATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCCATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA +MK115095.1,rev_exon1,5373,5451,5969,6045,forward,0.6538461538461537,MAGRSGDSDEELLTAVRIIKRLYQSS,MAGRSGDSDEELLTAVRIIKRLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT +MK115095.1,vpu,5465,5711,6061,6310,forward,1.3548780487804881,SIVLIEYKKILRQKKIDRLIDRIRERAEDSGNESDEDQEELSAIVEIGHLVP,MHALEIAAIVRLVVAAIIAIVV*SIVLIEYKKILRQKKIDRLIDRIRERAEDSGNESDEDQEELSAIVEIGHLVP*DSDDM*,ATGCATGCCTTAGAAATAGCAGCAATAGTAAGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGTCTATAGTATTAATAGAATATAAGAAAATTTTAAGACAAAAGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGAGGACCAGGAAGAATTATCAGCAATTGTAGAGATAGGGCATCTTGTTCCTTAGGATAGTGATGATATGTAG +MK115095.1,env,5628,8229,6224,8795,forward,1.8721962616822374,MTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD,MKVTRTRKNYQQL*R*GILFLRIVMICSANNL*VTVYYEVPVWKEATTTLFCASDAKAYKTEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDELNLNCPNNNTCSNNTKYNMTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD*NDTLKQIVIKLKEKFKNKTIVFNQSSGKDPEIVMHSFNCREEFFYCNTTQLFNST*NNNT*NGTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQGQIRCSSNITGLLLVRDSKSNNSSNDTKTFRPRRGDMKDN*RSELYKYKVVKIEPLRIAPTHAKRRVVQKEKRAIGLRAFFLKFLGAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLALERYLKDQQLLKI*GCSRKLICTTNVP*NVS*SPR*NRSLDKI*TNMT*KQ*EKEIDNYTDTIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQWL*YIKIFIMIVRGLISLRIVFTILSIVNRVRQRYSPLSLQTLLPTQRGPDRPERTEEGGREKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLRDLLLIVARIVELLRRRK*EALKYW*NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL*,ATGAAAGTGACGAGGACCAGGAAGAATTATCAGCAATTGTAGAGATAGGGCATCTTGTTCCTTAGGATAGTGATGATATGTAGTGCCAACAACTTGTAGGTCACAGTCTATTATGAGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTAGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATAAGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATGAATTAAATCTAAATTGCCCTAACAATAATACTTGTAGTAATAATACTAAATATAATATGACGGAAGAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAAGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAAGTAGTGGAAATACTACAGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATAGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATAGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAAGGAGGGCATTTTATAGAACAGACATAATAGGAGATATAAGACAAGCGCATTGTAACATTAGTAGGAAAGATTAGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTAAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAAAGGACCCAGAGATAGTGATGCATAGTTTTAATTGTAGAGAAGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTAGAATAATAATACTTAGAATGGTACTGATAATTAGAATAGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAAGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATAGTAAGAGCAACAATAGTAGTAATGATACAAAGACCTTCAGGCCTAGAAGAGGAGATATGAAGGACAATTAGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAAGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAGAAAGAAAAAAGAGCAATAGGACTTAGAGCTTTCTTCCTTAAGTTCTTAGGAGCAGCAGGAAGCACTATAGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTAAGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTAGAAAGATACCTAAAAGATCAACAGCTCCTGAAGATTTGAGGTTGCTCTAGAAAACTCATTTGCACCACTAATGTGCCCTAAAATGTTAGTTAGAGCCCTAGATAGAATAGATCTCTAGATAAGATTTAGACTAACATGACCTAGAAGCAGTAGGAAAAAGAAATTGACAATTATACAGACACAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTAGCATTAGATAAGTAGGCAAGTTTGTAGAATTAGTTTGACATTACACAGTGGCTATAGTATATAAAAATATTCATAATGATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGAGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAAAGGACAGATAAGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAAGCTTTGCTATAA +MK115095.1,tat_exon2,7810,7903,8376,8469,forward,0.4866666666666659,RPSSQPRGDPTGPKEQKKEVERKTEAHPRD,RPSSQPRGDPTGPKEQKKEVERKTEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAG +MK115095.1,rev_exon2,7811,8087,8377,8653,forward,1.2406593406593407,ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE,DPPPNPEGTRQARKNRRRR*RERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAG +MK115095.1,nef,8287,8878,8796,9417,forward,0.9788617886178801,MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*H*,ATGAGACAAGCTAGGCCAGTAAGAAAGCCAGAGCCAGCAGCAACTAAGGTAAGAGCAGCATCTCGAGACCTAGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTAGAAGCACAACAGGAAGAAAAAGAGGTAGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAAGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAAGGCCAGGAGTCAGATTTCCACTGTGTTTTAGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATAGAATAGAAGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGACACTAA +MK115490.1,gag,549,2055,789,2292,forward,0.2571999999999999,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115490.1,pol,1841,4853,2084,5096,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115490.1,vif,4797,5376,5040,5619,forward,0.36979166666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115490.1,vpr,5315,5609,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115490.1,tat_exon1,5586,5802,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG +MK115490.1,rev_exon1,5725,5803,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115490.1,vpu,5817,6063,6061,6310,forward,0.6500000000000001,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115490.1,env,5980,8521,6224,8795,forward,0.4941588785046729,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115490.1,tat_exon2,8102,8198,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115490.1,rev_exon2,8103,8388,8377,8653,forward,0.4285714285714286,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115490.1,nef,8522,9143,8796,9417,forward,0.5918699186991796,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +MK115576.1,gag,468,1974,789,2292,forward,0.2571999999999999,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAG +MK115576.1,pol,1760,4772,2084,5096,forward,0.14755732801595212,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115576.1,vif,4716,5295,5040,5619,forward,0.35416666666666674,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115576.1,vpr,5234,5528,5558,5850,forward,0.4038461538461544,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MK115576.1,tat_exon1,5505,5721,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG +MK115576.1,rev_exon1,5644,5722,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115576.1,vpu,5736,5982,6061,6310,forward,0.6865853658536587,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115576.1,env,5899,8440,6224,8795,forward,0.49018691588785046,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115576.1,tat_exon2,8021,8117,8376,8469,forward,0.28666666666666596,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115576.1,rev_exon2,8022,8307,8377,8653,forward,0.39560439560439553,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAG +MK115576.1,nef,8441,9062,8796,9417,forward,0.6162601626016186,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGA +OQ092466,gag,825,2361,789,2292,forward,0.16679999999999984,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCTAGCCTGTTAGAAACAGCAGAAGGCTGTAGACAAATATTGGGACAGTTACAACCGTCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACATTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGGTAAAAGACACCAAGGAAGCCTTAGAGAAGATAGAGGAAGAGCAAAACAAAAGCAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAGCAGCCAGGTTAGACACACAGGAAACAGCAGCCAGGTCAGCCAAAATTACCCTATAGTACAGAACCTTCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAATACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGACTACATCCAGTGCATGCAGGGCCCATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAGTAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTACACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGGGGACCCGGACATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCACGTAACAAATTCAAGTGCCATAATGATGCAGAGGGGCAATTTTAGAAACCAAAGAAAGGCTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCACCACCAGAAGAGATCTTCAGGTTTGTGGAAGAGACAACAACTCCCTCTCAGAAACAGGAGCCAATAGACAAGGAACTGTATCCTCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA +OQ092466,pol,2147,5165,2084,5096,forward,0.14356929212362912,FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCACCACCAGAAGAGATCTTCAGGTTTGTGGAAGAGACAACAACTCCCTCTCAGAAACAGGAGCCAATAGACAAGGAACTGTATCCTCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAGCTAAAGGAAGCTCTATTAGATACAGGGGCAGATGATACAGTATTAGAAGACATGAATTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAGGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTATTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGCATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGTATGACAAAAATCTTAGAGCCTTATAGAACACGAAATCCAGAAATGGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGACTTAGAAATAGGGCAACATAGAGCAAAAATAGAGGAACTGAGACAACATCTGTTGAAGTGGGGATTTACTACCCCAGACAAAAAACATCAAAAAGAACCTCCATTCCTTTGGATGGGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAAACAAAGACAGCTGGACTGTCAATGACATACAGAAACTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACCCAGGGATTAAGGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCGCTAACAGAAGAAGCAGAGTTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGGGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGGAAGGACAATGGACATTTCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGCGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAGGCATAGTAATATGGGGAAAAATTCCTAAATTTAGACTACCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAACACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAAACTAAAAAAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGATACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATACGCATTGGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTGATAAAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTGCTGGAATCAGGAAAGTATTATTTTTAGATGGAATAGAGAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGCTAAAAGGAGAAGCCATACATGGACAGGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTCATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATACGGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATCCAAACCAAAGAACTACAAAAACAAATTATAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTTATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +OQ092466,vif,5109,5688,5040,5619,forward,0.203125,MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGTATGTTTCAAGGAAAGCTAAGGGATGGTTTTATAGACATCACTTTGAAAGCAATCATCCAAAAATAAGTTCAGAAGTACACATCCCACTGGAGGATGCTAGACTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGGGTCTCCATAGAATGGAGGAAAAAGAGATATAGCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTACTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACACATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAATAACACCAAAAAAGAGAAAGCCACCCTTGCCTAGTGTTAAGAAGCTAACAGAAGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +OQ092466,vpr,5627,5921,5558,5850,forward,0.3653846153846132,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*A,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAGCTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTCCATAGCTTAGGGCAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATTCTGCAACAACTGTTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGGCT +OQ092466,tat_exon1,5898,6114,5830,6045,forward,0.45833333333333326,MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ,MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ,ATGGAGCCAGTAGATCCTAGGCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCACTTGTTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAG +OQ092466,rev_exon1,6037,6115,5969,6045,forward,0.5769230769230769,MAGRSGDSDDELLKTVRLIKVLYQSS,MAGRSGDSDDELLKTVRLIKVLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAGT +OQ092466,vpu,6129,6375,6061,6310,forward,0.6097560975609757,MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL,MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL*,ATGCAACCTTTAACAATATTAGCAATAGTAGCACTAGTAGTAGCAGCAATACTAGCAATAGTTGTGTGGTCCATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGAGGGGGATCAGGAAGAATTATCAGCACTGGTGGAGAGGGGGCATCTTGCTCCTTGGAATGTTGATGATCTGTAA +OQ092466,env,6292,8902,6224,8795,forward,0.5255841121495328,MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL,MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL*DGWQMVKK*,ATGAAAGTGAGGGGGATCAGGAAGAATTATCAGCACTGGTGGAGAGGGGGCATCTTGCTCCTTGGAATGTTGATGATCTGTAATGCTACAGAACAACAATTGTGGGTTACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGGTATTAAAAAATGTGACAGAAAATTTTAATATGTGGGAAAATAACATGGTAGAACAGATGCATGAAGATATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAGTTAACTCCACTCTGTGTTACTCTAAATTGCACTAATACCACTAGGAGTAGTGGAAATACTACCAATGAAATGAAAAACTGCTCTTTCTATACCGAAACAGACATAAGAGATAAGAAGAGAAAGGAATATGCACTTTTTTATGAACTTGATATAGTACCCATAGATGAGGATAATAAGAATAAGAGTAATAATATTAGCTATTCTAGGTTAATAAGTTGCAACACCTCAGTTATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATGATAAGAAATTCAATGGAACAGGGCCATGTACAAATGTCAGCACAGTGCAATGTACACATGGTATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGACGAGGTAGTAATTAAATCTAGCAATTTCACGAACAATGCTAAAACCATAATAGTACAGCTAAATGAAACTGTAAAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGACATAAGACAAGCACATTGTAACATCTCTAGAGCAAACTGGACAAACACTTTAAAACAGATAGCTGAAAAATTAGGAAAACAATTTGAGGAAAATAAAACAATAGTCTTTAATCCCTCCTCAGGAGGGGACCCAGAGGTTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATTCAACACCACTGTTTAATAGTACTTGGAAGGAGACTAATGGGATTTGGACTCGTATTGGAGAGTCAAATGATAGTGCTACTATCACACTAAATGATAGTGATACTATCACACTCCAATGTAAAATAAGGCAAATTATAAACTTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAAAGGACAAATTAGCTGTTTATCAAACATTACAGGGCTGCTATTAGTAAGAGATGGTGGCAATAACACGAACGGGACCGAGATCTTCAGACCTGTAGGAGGAGAAATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAGAAAAGAGCGACATTGGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAGGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGTAATAAATCTCTGGAAAAAATTTGGAATAATATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAAGCTTAATATACACCTTACTTGAAGAATCGCAGAACCAGCAAGAAAAAAATGAAAAAGAATTATTGGAATTAGATACATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATAATGATAATAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTCCAGATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGAACGGATTCTTAGCACTTTTCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCTCTCAAATACGGGTGGAGTCTCCTACAATATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAATATTACAAAGAGCTTGTAGAGCTATTCTCCATATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAAGATGGGTGGCAAATGGTCAAAAAGTAA +OQ092466,tat_exon2,8456,8552,8376,8469,forward,0.886666666666666,RSTPQLRGDPTGPKESKEKVERETETDPVH,RSTPQLRGDPTGPKESKEKVERETETDPVH**,AGATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGA +OQ092466,rev_exon2,8457,8733,8377,8653,forward,0.3626373626373627,DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE,DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE*,GATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGAACGGATTCTTAGCACTTTTCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCTCTCAAATACGGGTGGAGTCTCCTACAATATTGGAGCCAGGAACTAAAGAATAG +OQ092466,nef,8876,9509,8796,9417,forward,0.5040650406503988,MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC,MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC*,ATGGGTGGCAAATGGTCAAAAAGTAAGCTATTTGGATGGCCTGCTGTAAGGGAAAGAATGAGAAGAGCTGAGCCAGCAGCAGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACACGGAGCAATCACAAGTAGCAATACACCAACTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAAGAGGAGGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCGGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCCAAAAAGACAAGAGATCCTTGATCTGTGGGTCTATCATACACAAGGTTTCTTCCCTGATTGGGATAACTACACACCAGGGCCAGGGATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGTTAGTACCAGTGGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAATAACTGCTTGTTACACCCTATGAGCCAGCATGGGATGGAGGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCGTCACGTGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGA +OQ092463,gag,801,2313,140,1643,forward,0.20240000000000014,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGATAGATGGGAAAGAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAGCGGTTCGCAGTTAATCCTGGCCTGTTAGAAACATCAAAAGGCTGTAGACAAATATTGGAACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATAGATGTAAAAGACACCAAGGAAGCTTTAGATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAACACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGACCAGCCAGGCCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGACTAAATAAAATAGTAAGGATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAATCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAACAATGTACACAGGAGGTAAAAAATTGGATGACAGAAACATTATTGGTCCAAAATGCAAACCCAGATTGCAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCTGGCCATAAAGCAAGAGTTTTGGCAGAAGCAATGAGCCAAGTAACAACTCCAGGTACCATAATGATGCAGAGAGGCAATTTCAGGAACCAGAGAAAGAATGTTAAGTGTTTCAACTGTGGCAAAGAAGGGCATATAGCTAAAAATTGCAGGGCCCCTAGAAAAAGGGGCTGTTGGAAATGTGGAAAAGAAGGACACCAAATGAAAGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGGTAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +OQ092463,pol,2105,5117,1435,4447,forward,0.10767696909272173,FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGGTAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGACATGACTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTTGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTAACTCAAATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATCTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAGTCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGATGAATTAAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGATATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGTTGCCAGAAAAGGACAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAGGCACTAACAGAAGTAGTACCACTAACAAGAGAAGCAGAGCTAGAGCTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAGTTACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAATGAGAGGTGCCCACACTAATGATGTAAAGCAACTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAGTTTAAACTACCCATACAAAGAGAAACATGGGACACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCTATAGTAGGAGCAGAAACTTTCTATGTAGATGGTGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGATACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTTAATCAAATAATAGAACAGTTAATAAAAAAGGACAAGGTATACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGATGACCATGAGAAATATCACAGTAATTGGAGGGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGCCAGTTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACACTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGGTATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCAGCAATTTCATCAGTACTACAGTTAAGGCCGCCTGCTGGTGGGCGGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATCATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATACATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAACTTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +OQ092463,vif,5061,5640,4391,4970,forward,0.296875,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGGACATGGAAAAGTTTAGTAAAACACCATATGTATATTTCAAGGAAAGCTAAGGGATGGGTTTATAAGCATCACTATGACAGTATTCATCCAAGAATAAGTTCAGAAGTTCACATCCCACTAGGGGATGCGAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCACTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAGGAGAGATATAGCACACAAGTAGACCCTGGCCTAGCAGACCAACTAATTCATCGGTATTACTTTGATTGTTTTTCAGAATCTGCCATAAGAAATGCCATATTAGGACGTATAGTTAGTCCTAGTTGTGATTATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG +OQ092463,vpr,5579,5870,4909,5200,forward,0.30208333333333326,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAITRILQQLLFIHFRIGCQHSRIGIIQRRRARNGTSRS,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAITRILQQLLFIHFRIGCQHSRIGIIQRRRARNGTSRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACACTTCCCTAGGCCATGGCTCCACAGCTTAGGGCAACATATCTATGAAACATATGGAGATACTTGGGCAGGAGTGGAAGCCATAACAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATCATTCAACGGAGGAGAGCAAGAAATGGAACCAGTAGATCCTAG +OQ092463,tat_exon1,5850,6066,5180,5395,forward,0.38888888888888884,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ,ATGGAACCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAG +OQ092463,rev_exon1,5989,6067,5319,5395,forward,0.34615384615384626,MAGRSGDSDEELIKTVRLIKLLYQSS,MAGRSGDSDEELIKTVRLIKLLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGT +OQ092463,vpu,6081,6330,5411,5657,forward,0.44999999999999996,MQPLEISAIVALVVAIIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL,MQPLEISAIVALVVAIIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL*,ATGCAACCTTTAGAAATATCAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGGTCCATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGATAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAGGGGGATCAGGAAGAATTATCAGCACTTGTTGTGGAGATGGGGCACGATGCTCCTTGGGATGTTAATGATCTGTAG +OQ092463,env,6244,8827,5574,8124,forward,0.44534746760895216,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFYASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNTTSTKNTTPSTTASSGERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKKFNGSGPCTNVSTIQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKTIIVHLKDSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSSWKDESNGTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLITRDGGKNNESNTTEIFRPEGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKTLEQIWDNMTWMQWEREIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHPPAPRGPDRPEGIGEEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLNIPRRIRQGLERALL,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFYASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNTTSTKNTTPSTTASSGERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKKFNGSGPCTNVSTIQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKTIIVHLKDSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSSWKDESNGTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLITRDGGKNNESNTTEIFRPEGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKTLEQIWDNMTWMQWEREIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHPPAPRGPDRPEGIGEEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLNIPRRIRQGLERALL*,ATGAGAGCGAGGGGGATCAGGAAGAATTATCAGCACTTGTTGTGGAGATGGGGCACGATGCTCCTTGGGATGTTAATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACTACCACTCTATTTTATGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCTACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGGAAATGTGACAGAGAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTGAATTGCACTAATTATAATAACACCAATACCACTAGTACCAAGAATACCACCCCTAGTACCACTGCTAGTAGCGGGGAAAGGATGGGGGAAGGAGAAATAAAAAACTGCTCTTTCAATATCACCACAAGCCTAAGAGATAAGATGCAGAAAGAATATGCACTCTTTTATAGACCTGATATAGTACCAATAGATAATGATAATACTAGTTATAGGTTGATAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCAGCTGGTTTTGCGATTCTAAAGTGTAACAATAAGAAGTTCAATGGATCAGGACCATGTACAAATGTCAGCACAATACAATGTACACATGGAATTAGGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGAAAATTTCTCAGACAATGCTAAAACCATAATAGTACATCTGAAGGATTCTGTAGAAATTACTTGTATAAGACCCAACAACAATACAAGAAAAAGTATACCTATGGGACCAGGGAAAGCATTTTTTGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAAAATTAATAAAACGAAATGGAATAACACTTTAGACCAGATATTTAAAAAGTTAAGAGAACAATTTGGGAATAATAAGACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTGTAACGCACAATTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACATCAAAACTGTTTAATAGTACTTGGAATGAGACTAGTTCTTGGAAGGATGAGTCAAATGGCACTATCACACTCCCATGCAGAATAAAGCAAATTATAAACCTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGACTCATTAAATGTTCATCAAATATCACAGGGCTGCTAATAACAAGAGATGGTGGGAAAAATAATGAGAGCAACACCACCGAGATTTTCAGACCTGAAGGAGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAAACTCTGGAACAGATTTGGGATAACATGACCTGGATGCAATGGGAAAGAGAAATTGACAATTACACAAGCTTGATATACACTTTAATTGAAGAATCGCAAAACCAACAAGAAAAGAATGAACTAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTGCTTTCTATAGCGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCACCCCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCGGGGGGTGGGAACTCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTATTAGCTTGCTTAATGCTACAGCCATAGCAGTAGCTGAGGGGACAGACAGGATTATAGAAGTATTACAAAGAGCTGGGAGAGCTTTTCTCAACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA +OQ092463,tat_exon2,8408,8504,7705,7798,forward,0.6000000000000001,RPTPQPRGDPTGQKESEKKVERETETDPDH,RPTPQPRGDPTGQKESEKKVERETETDPDH**,AGACCCACCCCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGA +OQ092463,rev_exon2,8409,8685,7706,7982,forward,0.3296703296703296,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE*,GACCCACCCCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCGGGGGGTGGGAACTCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG +OQ092463,nef,8828,9461,8125,8752,forward,0.29182692307692304,MGGKWSKSSVVGWPAIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC,MGGKWSKSSVVGWPAIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC*,ATGGGTGGTAAGTGGTCAAAAAGTAGTGTGGTTGGATGGCCTGCTATAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTAGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCAGGCCTCAGGTACCTTTAAGACCAATGACTTATAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAGAAAAGACAAGATATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTGCCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGATGACCCAGAGAAAGAAGTGTTAGTATGGAGATTTGACAGTCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGGATTGCTGA +OQ092465,gag,855,2364,200,1700,forward,0.3737903225806454,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQQIDVKDTKEALDKIEEEQNKSKKKVQQAATDTGNNSQASQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGAIMMQRGNFRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEETTTPSQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQQIDVKDTKEALDKIEEEQNKSKKKVQQAATDTGNNSQASQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGAIMMQRGNFRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEETTTPSQKQEPIDKELYPLASLRSLFGNDPSSQ*R*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGATAGGTGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAACTAGAACGGTTTGCAGTTAATCCTGGCCTGTTAGAAACATCAAAAGGCTGTAGACAAATATTGGAACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAACAGATAGATGTAAAAGACACCAAGGAAGCTTTAGATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGTACAGCAAGCAGCAACTGACACAGGAAACAACAGCCAGGCCAGCCAAAATTACCCTATAGTGCAGAATCTCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAATCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAACAATGTACACAGGAGGTAAAAAATTGGATGACAGAAACATTATTGGTCCAAAATGCAAACCCAGACTGCAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCTGGCCATAAAGCAAGAGTTTTGGCAGAAGCAATGAGCCAAGTAACAACTCCAGGTGCCATAATGATGCAGAGAGGCAATTTCAGGAGCCAAAGAAAGACTGTTAAGTGTTTCAACTGTGGCAAAGAAGGGCATATAGCTAAAAATTGCAGGGCCCCTAGAAAAAGGGGCTGTTGGAAATGTGGAAAAGAAGGACACCAAATGAAAGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTCGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAG +OQ092465,pol,2150,5162,1492,4504,forward,0.1734795613160518,FFREDLAFPQGEAREFSSEQTRANSPTSRELQVRGGDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCRLLKGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTSRELQVRGGDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCRLLKGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTCGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGACACAGGAGCAGATGATACAGTATTAGAAGACATGACTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTTGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTTTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATCTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGATGAATTAAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGTTGCCAGAAAAAGACAGTTGGACTGTTAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAGGTAAAGCAATTATGTAGACTCCTTAAGGGAACCAAGGCACTAACAGAAGTAGTACCACTAACAAGAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAGTTACAGAAGCAGGGACAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGAGGTGCCCACACTAATGATGTAAAACAGCTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAGTTTAAACTACCCATACAAAGAGAAACATGGGACACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTTTATGTAGATGGTGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAATAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACCACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATCCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTTAATCAAATAATAGAACAGTTAATAAAAAAGGACAAAGTATACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGATGATCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGCCAGTTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACACTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGTGGCAATTTCATCAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAATTTGGCATACCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATCATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATACATACACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAACTTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +OQ092465,vif,5106,5685,4448,5027,forward,0.33854166666666674,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWIYKHHYDSINPKISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADRLIHLYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALTALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWIYKHHYDSINPKISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADRLIHLYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALTALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGGACATGGAAAAGTTTAGTAAAACACCATATGTATATTTCAAAGAAAGCTAAGGGATGGATTTATAAGCATCACTATGACAGTATTAATCCAAAAATAAGTTCAGAAGTTCACATCCCACTAGGGGATGCAAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTAGCAGACCGACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACGTATAGTTAGTCCTAGTTGTGATTATCAAGCAGGACATAACAAGGTAGGGTCTCTACAGTACTTGGCACTAACAGCACTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG +OQ092465,vpr,5624,5915,4966,5257,forward,0.17708333333333326,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGILQRRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGILQRRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACACTTTCCTAGGCCATGGCTACACAGCTTAGGGCAACATATCTATGAAACATATGGAGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATCCTTCAACGGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +OQ092465,tat_exon1,5895,6111,5237,5452,forward,0.25,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ,ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAG +OQ092465,rev_exon1,6034,6112,5376,5452,forward,0.5769230769230769,MAGRSGDSDEELIKTVRLIKLLYQSS,MAGRSGDSDEELIKTVRLIKLLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGT +OQ092465,vpu,6126,6375,5468,5708,forward,0.3063291139240505,MQPLVISAIVALVVVAIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL,MQPLVISAIVALVVVAIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL*,ATGCAACCTTTAGTAATATCAGCAATAGTAGCATTAGTAGTAGTAGCGATAATAGCAATAGTTGTGTGGTCCATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGATAATTGATAGAATAAGGGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAGGGGGATCAGGAAGAATTATCAGCACTTGTTGTGGAGATGGGGCACGATGCTCCTTGGGATGTTAATGATCTGTAG +OQ092465,env,6289,8881,5631,8208,forward,0.5249417249417256,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTGANNTTSTNTTTPSTTVSSEERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNTSYRLISCNTSVITQACPKVTFEPIPIHYCAPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKNIIVHLNKSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLEQVFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSYWKGEGSNNDTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLLTRDGGNESETTDTETFRPVGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKNLTQIWDNMTWMQWEKEIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTGANNTTSTNTTTPSTTVSSEERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNTSYRLISCNTSVITQACPKVTFEPIPIHYCAPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKNIIVHLNKSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLEQVFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSYWKGEGSNNDTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLLTRDGGNESETTDTETFRPVGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKNLTQIWDNMTWMQWEKEIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL*,ATGAGAGCGAGGGGGATCAGGAAGAATTATCAGCACTTGTTGTGGAGATGGGGCACGATGCTCCTTGGGATGTTAATGATCTGTAGCGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTGTGGGCTACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGGAAATGTGACAGAGAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGTCTAAAACCATGTGTAAAATTAACCCCACTCTGTGTTACTTTGAATTGCACTAATTATAATAACACTGGTGCCAATAATACCACTAGTACCAATACTACCACCCCTAGTACCACTGTTAGTAGCGAGGAAAGGATGGGGGAAGGAGAAATAAAAAACTGCTCTTTCAATATCACCACAAGCCTAAGAGATAAGATGCAGAAAGAATATGCACTCTTTTATAGACCTGATATAGTACCAATAGATAATACTAGTTATAGGTTGATAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAGCCAATTCCCATACATTATTGTGCCCCAGCTGGTTTTGCGATTCTAAAGTGTAACAATAAGACGTTCAATGGATCAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGAAAATTTCTCAGACAATGCTAAAAACATAATAGTACATCTGAATAAATCTGTAGAAATTACTTGTATAAGACCCAACAACAATACAAGAAAAAGTATACCTATGGGACCAGGGAAAGCATTTTTTGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAAAATTAATAAAACGAAATGGAATAACACTTTAGAGCAGGTATTTAAAAAGTTAAGAGAACAATTTGGGAATAATAAGACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTGTAACGCACAATTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACATCAAAACTGTTTAATAGTACTTGGAATGAGACTAGTTATTGGAAGGGTGAAGGGTCAAACAATGACACTATCACACTCCCATGCAGAATAAAGCAAATTATAAACCTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACTCATTAAATGTTCATCAAATATCACAGGGCTACTATTAACAAGAGATGGTGGTAACGAGAGCGAGACCACCGACACTGAGACCTTCAGACCTGTAGGAGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGATTAGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAAAATCTGACACAGATTTGGGATAACATGACCTGGATGCAATGGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTGAAGAATCGCAAAACCAACAAGAAAAGAATGAACTAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTGCTTTCTATAGCGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCGGGGGGTGGGAACTCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTATTAGCTTGCTTAATGCTACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGCAGGGAGAGCTTTTCTCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA +OQ092465,tat_exon2,8462,8558,7789,7882,forward,3.5,RPTSQPRGDPTGQKESKEKVERETETDPDH,RPTSQPRGDPTGQKESKEKVERETETDPDH**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGA +OQ092465,rev_exon2,8463,8739,7790,8066,forward,0.41758241758241765,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCGGGGGGTGGGAACTCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG +OQ092465,nef,8882,9515,8209,8842,forward,0.3285714285714285,MGGKWSKSSVVGWPKIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC,MGGKWSKSSVVGWPKIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGGTTGGATGGCCTAAAATAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGAACCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCAGGCCTCAGGTACCTTTAAGACCAATGACTTATAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAGAAAAGACAAGATATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGATGACCCAGAGAAAGAAGTGTTAGTATGGAGATTTGACAGTCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGA +OQ092462,gag,767,2270,789,2292,forward,0.27679999999999993,MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAGCTAAAACATATAGTATGGGCAAGCAGGGAACTAGAGCGATTTGCAGTTAATCCCGGCCTGTTAGAAACATCGGAGGGCTGTAGACAAATACTAGGGCAACTACAGCCCGCTCTTCAGACAGGATCAGAAGAACTTAAATCACTATTTCATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTGAAAGACACCAAAGAAGCTTTAGAGAAGATAGAGGAAGAGCAAAAGAAAAGTAAGAAAAAGGCACAGCAAGCAGCCGCTGACACAGGAAATAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATGCAGGGACAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGATAAGGCTTTCAGTCCAGAAGTAATACCCATGTTTACAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAATACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTACATCCAGTGCAGGCAGGGCCTGTTGCGCCAGGCCAGCTACGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTAACCTTCAGGAGCAAATAGCATGGATGACACATAATCCACCTGTCCCAGTAGGAGAAATCTATAAAAGATGGATACTTCTGGGATTAAATAAAATAGTAAGAATGTACAGCCCCGTCAGCATTCTGGACATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCTGAGCAGGCTTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAGCAAATCCAGCTAGCATAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGCCTATTAAGTGTTTCAACTGTGGCAAAGAGGGGCATATTGCTAAAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGGTCTGGCCTTCCCGCAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACGACAACTCCCTCTCAGAAACCGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +OQ092462,pol,2062,5074,2084,5096,forward,0.1495513459621136,FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGGTCTGGCCTTCCCGCAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACGACAACTCCCTCTCAGAAACCGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGAGGGCAACTAAAGGAAGCTCTATTAGACACAGGAGCAGATGATACAGTTTTAGAAGAAATGAATTTGCCAGGAAAATGGAAGCCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGCTGCACTTTAAATTTTCCCATTAGCCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATCTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCCATAAAGAAGAAAGATGGTAATAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCTGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAGGACTTCAGGAAGTATACTGCATTTACAATACCTAGCACAAACAATGAGACACCAGGGATTAGATACCAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTGGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATTTATCAATACATGGATGATTTATATGTAGGGTCTGACTTAGAAATAGGGCAGCATAGAGCAAAAATAGAGGAACTGAGACAACATCTATTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCCGATAAATGGACAGTACAGCCTATATTGCTGCCAGAAAAAGACAGCTGGACTGTTAATGACATACAGAAGTTAGTGGGAAAATTGAACTGGGCAAGTCAGATTTACCCAGGAATCAAAGTAAGGCAGCTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTGGTACCACTAACAGCAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGATTTAATAGCAGAACTACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATATAAAAATCTGAAAACAGGAAAGTATGCAAGAATGAGAGGTACCCACACTAATGATATAAAACAATTAACAGAGGCAGTGCAAAAAATAGCTACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAATTACCCATACAAAAGGAAACATGGGAAGCATGGTGGATAGAGTATTGGCAAGCCACCTGGATTCCTGAATGGGAGTTTGTCAATACCCCTCCCTTAGTGAAACTATGGTACCAGTTGGAAAAAGAACCCATAGTGGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGGGAAACTAAATTAGGAAAAGCAGGATATGTTACTGACAAAGGAAGACAAAAAGTTGTCCCCCTAACGGACACAACAAATCAGAAGACTGAGCTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAACTAGTCAGTCAAATAATAGAGCAGTTAATAAAGAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAGTTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACCTGCCACCTATAGTAGCAAAGGAAATAGTAGCCAGTTGTGACAAATGTCAGTTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCTGGAATATGGCAGCTAGATTGTACACATCTAAAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTCTCTTGAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCTGCCTGTTGGTGGGCGGGGATCAAACAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGAAGTAATAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCAGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCGTCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACCAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATTATCAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +OQ092462,vif,5018,5597,5040,5619,forward,0.34375,MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAGAGTTTAGTAAAACATCATATGCATATATCAAGGAAAGCTAAGAATTGGTTGTATAGACATCACTATGAAAGCATTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTAGTAATAACAACATATTGGGGTCTGCTTACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGGAAAGGAGATATAGAACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTATTTTGATTGTTTTTCAGAGTCTGCTATAAGAAATGCCTTATTAGGACGTGTAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACCAGGTAGGATCTCTACAGTACTTGGCACTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGGCACTAG +OQ092462,vpr,5536,5830,5558,5850,forward,0.32692307692307465,MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS,MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS*P,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGGCACTAGAACTTTTAGAGGAACTTAAAAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTTCATGGATTGGGACAGCATATCTATGAAACATATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGATGTCGACATAGCAGAATAGGCATTAATCTACAGAGGAGAGCAAGGAATGGATCCAGTAGATCCTAGCCT +OQ092462,tat_exon1,5807,6026,5830,6045,forward,0.41666666666666674,MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ,MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ*,ATGGATCCAGTAGATCCTAGCCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTACCAATTGTTATTGTAAAAAGTGCTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGTAA +OQ092462,rev_exon1,5946,6024,5969,6045,forward,0.5769230769230769,MAGRSGDSDEELLKAVRLIKFLYQSS,MAGRSGDSDEELLKAVRLIKFLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGT +OQ092462,vpu,6038,6284,6061,6310,forward,0.7073170731707319,MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL,MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL*,ATGCGACCTTTAGAAATAGCAGCAATAGTAGCACTAGTAGTAGCAGTACTAATAGCAATAGTTGTGTGGTCTATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGATAGTGGATAGAATAAGAGAAAGAGCAGAAGATAGTGGAAATGAGAGTGAAGGGGATCAGGAGGAATTATCAGCACTGGTGGAGAGGGGGCACCTTGCTCCTTGGGATATTGATGATCTGTAG +OQ092462,env,6201,8844,6224,8795,forward,0.5698598130841122,MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL,MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL*DGWQGVKNEGMGCCKGKNEAN*,ATGAGAGTGAAGGGGATCAGGAGGAATTATCAGCACTGGTGGAGAGGGGGCACCTTGCTCCTTGGGATATTGATGATCTGTAGTGCCACAGAGAACTTGTGGGTCACAGTCTACTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTTTATTTTGTGCATCAGATGCCAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAGCCCACAAGAAGTAGTATTGAAAAATGTGACAGAAAAGTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATCAGGATATAATCAGTTTATGGGATGAAAGCCTAAAACCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATGCTACTATCAGTGGTAATGCAACAGAAGAAATAAAAAACTGCTCTTTCAATGTCAATACAAAAATAGGAGGTAAGAAGCAGAAAGAACGTGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAGTACTAATAGGACTAATACCAGCTATAGGTTGATAAGTTGTAACACTTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTGGAGATAAAGAGTTCAATGGAACAGGACTATGTAGAAATGTCAGCACAGTCCAATGTACACATGGAATCAGGCCAGTAGTATCAACTCAATTGCTGTTGAATGGCAGTCTAGCAGAAGGAGAGGTAGTAATTAAATCTGAAAATATCACGAACAATGTTAAAACCATAATAGTACAGCTAAATGAAACTGTATCAATTAATTGTACAAGACCTAGCAACAATACAAGAAGAAGCATACATATGGGACCAGGGAGAGCCTTTTATGCAACAGGAGAAATAATAGGAGATATAAGGAAAGCACAGTGTATCCTGAATAAGACAGACTGGAGTGACACTTTAACAAGGATAGCTAAAAAATTACACAAGCAATTTCATGGACCAATAGCATTTGAGCAATCCTCAGGAGGGGACCCTGAAATTACAATGCACACTTTTAATTGTGGAGGGGAATTTTTCTACTGCAACACATCAGCGTTGTTTAGCGGGACCTGGAATGGTACTGCTTGGACTAATGCTACTTGGGGTAATATTGCAGGTAACAATATCACACTCCAATGCAGAATAAAACAATTTATAAACAGATGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGAGAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGCAGTAACACAACAAATGGTGGCGAGAATGGGACCCAGATTGGCGAGAATGTGACCCAGATCTTCAGACCTGGAGGAGGGGATATGAGGGACAATTGGAGAAGTGAATTATACAAATATAAAGTAGTAAAAATTGAGCCATTAGGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTAACATTCGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACACTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTTCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAGGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATGCTAGTTGGAGTAATAAAACTCTGGAAAAAATTTGGGGGAACATGACCTGGATGGAGTGGGAGAGAGAAATTGACAATTATACAGACTTAATATACACCTTAATTGAACAATCGCAGAACCAACAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAGGCTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGTTTAGTAGGTTTAAGAATAGTTTTTGCTGTGCTTTCTATAGTAAATAGAGTTAGGCAGGGATACTCACCATTATCATTCCAGACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGAACGGATTCTTAGCACTCATCTGGATCGACCTGCGGAGTCTGTTCCTCTTCAGCTACCTCCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGTTTGCTTAATGCTATAGCTATATCAGTAGCGGAGGGAACAGATAGGATTATAGAAGCAATACAAAGAATTTGTAGAGCTATCTTACACATACCTACAAGGATAAGACAGGGCTTAGAAAGGGCTTTGCTATAAGATGGGTGGCAAGGGGTCAAAAATGAGGGGATGGGTTGCTGTAAGGGAAAAAATGAGGCGAACTAA +OQ092462,tat_exon2,8359,8455,8376,8469,forward,0.4866666666666659,RPASQPRGDPTGPKEPTKKVERETETDPDH,RPASQPRGDPTGPKEPTKKVERETETDPDH**,AGACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGA +OQ092462,rev_exon2,8360,8636,8377,8653,forward,0.39560439560439553,DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE,DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE*,GACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGAACGGATTCTTAGCACTCATCTGGATCGACCTGCGGAGTCTGTTCCTCTTCAGCTACCTCCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG +OQ092462,nef,8779,9406,8796,9417,forward,0.7422764227642202,MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC,MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC*,ATGGGTGGCAAGGGGTCAAAAATGAGGGGATGGGTTGCTGTAAGGGAAAAAATGAGGCGAACTAAGCCAGAAGATGAGCCAGCAGCAAATGGGGTGGGGGCAGCATCTCGAGACTTGGAGAAATATGGCGCACTCACAAGTAGCAATACAGTAGCTACTAATGCTGATTTAGCTTGGCTAGAAGCACAAGAGGAAGAGGAGGTGGGCTTTCCAGTCAGACCTCAAGTACCTTTAAGACCAATGACTTACAAGGGAGCTCTAGATCTCAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGGTTCACCACACACAAGGCTATCTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCCCTGACTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATCAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATAGAGGACCCGGAGAAAGAAGTCTTAATGTGGAAGTTTGACAGCCACCTAGCATTCCGTCACATGGCCCGAGAGCTGCATCCGGAGTATTACAAAGACTGCTGA +OQ092464,gag,773,2282,200,1700,forward,0.38588709677419364,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ*R*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGATAGATGGGAAAGAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGGTTCGCAGTTAATCCTGGCCTGTTAGAAACATCAAAAGGCTGTAGACAAATATTGGAACAGCTACAGCCAGCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATCGATGTAAAAGACACCAAGGAAGCTTTAGATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGCCAGCCAAAATTACCCTATAGTGCAGAACATTCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCGCTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAACAATGTACACAGGAGGTAAAAAATTGGATGACAGAAACATTATTGGTCCAAAATGCAAACCCAGATTGCAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCTGGCCATAAAGCAAGAGTTTTGGCAGAAGCAATGAGCCAAGTAACAACTCCAGGTACCATAATGATGCAGAGAGGCAATTTAAGGAGCCAAAGAAAGACTGTTAAGTGTTTCAACTGTGGCAAAGAAGGGCATATAGCTAAAAATTGCAGGGCTCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAAGAAGGACACCAAATGAAAGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAAGAAATGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAG +OQ092464,pol,2068,5080,1492,4504,forward,0.1734795613160518,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAAGAAATGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGACATGACTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTAACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATCTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTAAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGATATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAGGACAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAGGCACTAACAGAAGTAATACCACTAACAAGAGAAGCAGAGCTAGAACTGGCAGAGAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGTAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGAGGTGCCCACACTAATGATGTAAAACAACTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAGTTTAGACTACCCATACAAAGAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAGACTTTCTATGTAGATGGTGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTTAATCAAATAATAGAACAGTTAATAAAAAAGGACAAGGTATACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGACGATCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGCCAGTTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACACTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCGGCAATTTCATCAGTACTACAGTTAAGGCCGCCTGCTGGTGGGCGGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATACATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAGAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAACTTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGACCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +OQ092464,vif,5024,5603,4448,5027,forward,0.29166666666666674,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGGACATGGAAAAGTTTAGTAAAACACCATATGTATATTTCAAGGAAAGCTAAGGGATGGGTTTATAAGCATCACTATGACAGTACTCATCCAAGAATAAGTTCAGAAGTTCACATCCCGCTAGGGGATGCGAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAGAAGAGATATAGCACACAAGTAGACCCTGGCTTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGCTGTGATTATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG +OQ092464,vpr,5542,5833,4966,5257,forward,0.20833333333333326,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGIIQRRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGIIQRRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACACTTTCCTAGGCCATGGCTCCACAGCTTAGGGCAACATATCTATGAAACATATGGAGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCATCATTCAACGGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +OQ092464,tat_exon1,5813,6032,5237,5452,forward,0.25,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAPPDSQTHQASLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAPPDSQTHQASLSKQ*,ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCCAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA +OQ092464,rev_exon1,5952,6030,5376,5452,forward,0.5769230769230769,MAGRSGDSDEELLQTVRLIKLLYQSS,MAGRSGDSDEELLQTVRLIKLLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCCAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGT +OQ092464,vpu,6044,6290,5468,5708,forward,0.4265822784810127,MQPLHIAAIVALVVAIIIAIVVWSIVFIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVEMGHCAPWDVNDL,MQPLHIAAIVALVVAIIIAIVVWSIVFIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVEMGHCAPWDVNDL*,ATGCAACCTTTACACATAGCAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGATAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAGGGGGATCAAGAAGAATTATCAGCACTTGTGGAGATGGGGCATTGTGCTCCTTGGGATGTTAATGATCTGTAG +OQ092464,env,6207,8790,5631,8208,forward,0.5058275058275068,MRVRGIKKNYQHLWRWGIVLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNNTTSTNDTTSTTTSSGEKMKEGEIKNCSFNITTSIRDKVQKEYALFYKPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGSCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSENFSDNAKTIIVHLNESVEITCIRPNNNTRKSIPIGPGRAFYATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNKTIIFTHSSGGDPEVVTHNFNCGGEFFYCNTTKLFNSTWNETSYWKDERSNDNDTITLPCRIKQIINLWQEVGKAMYAPPIRGYIKCSSNITGLLITRDGGKNESNTTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWDNMTWMEWEREIDNYTSLIYTLIEKSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSGPLVNGFLTIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL,MRVRGIKKNYQHLWRWGIVLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNNTTSTNDTTSTTTSSGEKMKEGEIKNCSFNITTSIRDKVQKEYALFYKPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGSCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSENFSDNAKTIIVHLNESVEITCIRPNNNTRKSIPIGPGRAFYATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNKTIIFTHSSGGDPEVVTHNFNCGGEFFYCNTTKLFNSTWNETSYWKDERSNDNDTITLPCRIKQIINLWQEVGKAMYAPPIRGYIKCSSNITGLLITRDGGKNESNTTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWDNMTWMEWEREIDNYTSLIYTLIEKSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSGPLVNGFLTIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL*,ATGAGAGTGAGGGGGATCAAGAAGAATTATCAGCACTTGTGGAGATGGGGCATTGTGCTCCTTGGGATGTTAATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCTACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGGAAATGTGACAGAGAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGTCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTGAATTGCACTAATTATAATAACACCAATAATACCACTAGTACCAATGATACCACTAGTACCACTACTAGTAGCGGGGAAAAGATGAAGGAAGGAGAGATAAAAAACTGCTCTTTCAATATCACCACAAGCATAAGAGATAAGGTGCAGAAAGAATATGCACTCTTTTATAAACCTGATATAGTACCAATAGATAATGATAATACTAGTTATAGGTTGATAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCAGCTGGTTTTGCGATTCTAAAGTGTAACGATAAGAAGTTCAATGGAACAGGATCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCTCAGACAATGCTAAAACCATAATAGTACATCTGAATGAATCTGTAGAAATTACTTGTATAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGACCAGGGAGAGCATTTTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAAAATTAATAAAACGAAATGGAATAACACTTTAGACCAGATATTTAAAAAGTTAAGAGAACAATTTGGGAATAAGACAATAATCTTTACTCACTCCTCAGGAGGGGACCCAGAAGTTGTAACGCACAATTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGAGACTAGTTATTGGAAGGATGAAAGGTCAAATGACAATGACACTATCACACTCCCATGCAGAATAAAGCAAATTATAAACCTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGATACATTAAATGTTCATCAAATATCACAGGGCTGCTAATAACAAGAGATGGTGGGAAAAACGAGAGCAACACCACCGAGACCTTCAGACCTGGAGGAGGAAATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAAAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGGATAACATGACCTGGATGGAATGGGAAAGAGAAATTGACAATTACACAAGCTTAATATACACTTTAATTGAAAAATCGCAAAACCAACAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGCGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAACTCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTATTAGCTTGCTTAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGCTGGGAGAGCTTTTCTCCACATACCTAGAAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +OQ092464,tat_exon2,8371,8467,7789,7882,forward,3.5,RPTSQPRGDPTGQKESKKKVERETETDPDH,RPTSQPRGDPTGQKESKKKVERETETDPDH**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGA +OQ092464,rev_exon2,8372,8648,7790,8066,forward,0.3846153846153846,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILNNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGTPQILVESPAVLESGTKE,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILNNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGTPQILVESPAVLESGTKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAACTCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG +OQ092464,nef,8791,9412,8209,8842,forward,0.3542857142857141,MGGKWSKSSVVGWPAIRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEDEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIHSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC,MGGKWSKSSVVGWPAIRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEDEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIHSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC*,ATGGGTGGTAAGTGGTCAAAGAGTAGTGTGGTTGGATGGCCTGCTATAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGATGAGGAGGTGGGTTTTCCAGTCAGGCCTCAGGTACCTTTAAGACCAATGACTTACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGGTATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGATGACCCAGAGAAAGAAGTGTTAGTATGGAGGTTTGACAGTCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGA +OQ092467,gag,808,2308,789,2292,forward,0.24380000000000002,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAAAAACAATACAAATTAAAACATCTAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTTCTAGAGACATCAGAAGGGTGTAGACAAATACTGGGACAGCTACAACCAGCTCTTCAGACAGGATCAGAAGAATTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAAATAGAGGAAGAGCAAAACCAAAGTAAGAAAAAAGCAGCAGCTGCAGCAGCTGACACAGGAAACAGAAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCTTTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTACAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAATAGGTGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCAGGCAGGGCCTGTTGCACCAGGCCAAATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTAACCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGATATCTATAAAAGATGGATAATTCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTGAGAGCCGAGCAAGCAACACAGGAAGTAAAGAATTGGATGACAGAAACTTTGCTGGTCCAAAATGCAAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCAGGCCACAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAACTGTAATGATGCAGAGAGGCAATTTTAGGAATCAAAGAAAGACAGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCATATAGCAAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAAAGAAGGGCACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAAACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGGGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA +OQ092467,pol,2100,5112,2084,5096,forward,0.14356929212362912,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAAACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGGGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAAATAGGGGGGCAGCTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGATATGAATTTACCAGGAAAATGGAAACCAAAAATGATAGGAGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGCTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGATAGTACTAAATGGAGAAAGTTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCGCATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCCTATTTTTCAATTCCCTTAGATAAAGACTTCAGGAAGTACACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAGGATATTAGAACCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTGGGATCTGACTTAGAAATAGGACAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGAAGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAAAGCTGCCAGAAAAAGATAGCTGGACTGTCAATGACATCCAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTATGCAGGAATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACTAAAGCACTAACAGAAGTAGTACCACTAACAGCAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCGGTACATGGAGTGTATTATGACCCAACGAAAGACCTAATAGCAGAACTACAGAAGCAGGGGCAAAGTCAATGGACATATCAAATTTATCAAGAACCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAATGAGGGGTGCCCACACTAATGATGTGAAACAATTAACAGAGGCAGTGCAAAAAATAGCCATAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAAATTACCTATACAAAAAGAAACATGGGAAACATGGTGGACAGACTATTGGCAAGCCACCTGGATTCCTGATTGGGAGTTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAAAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAGATCAGGCAAAGCAGGATATGTTACTGATAGAGGAAGACAAAAGGTTGTCCCCCTAACAGACACAACAAACCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTGACAGACTCACAATATGCACTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGTTAATAAAGAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGGAAGATACTATTTTTAGATGGAATAACTAAGGCCCAAGATGATCATGAGAGATACCACAGCAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTATAATAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCACGCATGGACAAGTAGACTGCAGTCCAGGAATATGGCAACTAGATTGTACGCATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTCTCTTAAAACTAGCAGGAAGATGGCCAGTAAAGACAGTACATACAGATAATGGCAGCAATTTCACCAGTGCTGCGGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCCCAAAGTCAAGGAGTCATAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAAGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAGAAACAAATCACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGACCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAGGCAAAGATCATTAGAGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +OQ092467,vif,5056,5644,5040,5619,forward,0.43229166666666674,MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH*SF*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATACATGTCTCAAAGAAAGCTAAGGGATGGGTTTATAGACACCACTATGAAAGCACCCATCCAAGAATAAGTTCAGAAGTACATATCCCGCTAGGGGAAGCTAGATTAGTAATAGCAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCACTTGGGTCAGGGAGTCTCCATAGAATGGAGGGAAAAGAAATATATCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGCATTATTTTGATTGTTTTTCAGAGTCTGCTATAAGAAATGCCATAGTAGGACGTTTAGTTAGCCCTCAGTGTGAATATCAAACAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGTAGCATTAATAACGCCAAAAAAGAGAAAGCCACCTTTGCCTAGTGTTAGGAAATTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGACCACAGAGGGAGCCATATAATGAGTGGACACTAGAGCTTTTAG +OQ092467,vpr,5574,5868,5558,5850,forward,0.4807692307692313,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*T,ATGGAACAAGCCCCAGAAGACCAAGGACCACAGAGGGAGCCATATAATGAGTGGACACTAGAGCTTTTAGAGGAACTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTCCATAACTTAGGACAATACATCTATGCAACTTATGGGGATACTTGGACAGGAGTGGAAGCTTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGATGTCAACATAGCAGAATAGGCATTACTCGACAGAGGAGAGCAAGGAATGGAGCCAGTAGATCCTAGACT +OQ092467,tat_exon1,5845,6064,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTCTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAACAGTGAGACTCATCAAGCAGCTCTATCAAAGCAGTAA +OQ092467,rev_exon1,5984,6065,5969,6045,forward,0.6346153846153846,MAGRSGDSDEDLLKTVRLIKQLYQSSK,MAGRSGDSDEDLLKTVRLIKQLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAACAGTGAGACTCATCAAGCAGCTCTATCAAAGCAGTAAG +OQ092467,vpu,6076,6340,6061,6310,forward,0.5439024390243903,MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL,MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL*,ATGCAACCCTTAGTAATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAGAAAGATAGATAGCATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAGGAAGAATTGTCGGCACTTGTGGAGATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAG +OQ092467,env,6239,8807,6224,8795,forward,0.49988317757009404,MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL,MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL*,ATGAGAGTGAAGGAGATCAGGAAGAATTGTCGGCACTTGTGGAGATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAGTGCTAAAGAACAATTGTGGGTCACAGTTTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTTTATTTTGTGCATCAAATGCTAAAGCATATGACCCAGAGGTGCATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACAAGAAGTACCATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGACATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTATTTTAAATTGCACTAATGTGAATGTTACTACTAACAATAATAGTAGTAGTGAGGAACAGATGGAGGTAGGAGAAATAAAAAACTGCTCTTTCAATATTGCCACAAGAATAAAAAATAAGATAAAGAAAGAATATGCACTTTTTAATAGACTTGATGTAGTACCAATAGAGGATGATAATACAAGCTATATGTTGATAAATTGTAATACCTCAGTCACTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATACTAAAATGTAATGATAAAAAGTTCAATGGAACAGGACCATGTAACAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGATAGTAGTTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACAGCTGAATAAAACTATAGAAATTAATTGTATAAGACCCAACAATAATACAAGAAAAAGTATATCTTTAAGACCGGGGCAAGCAATTTATGCAACAGAAGACATAATAGGAAATATAAGACAAGCACATTGTAACATTAGGAGAAAAGACTGGGATAAAGCTTTAGAACAGGTAGTTGCAAAATTAAGAGAACAATTTAAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAGGAGACCCAGAAATTGTAATGCATAGTTTTAATTGTGCAGGGGAATTTTTCTACTGTAACACAACAAAGCTGTTTAATAGTACTTGGAATGTTAATAACACTCGGAATAATACTACTGATAATAGCACCATCACTCTCCCGTGCAGAATAAAACAAATTATAAACAGATGGCAGGAAGTAGGAAAAGCAATGTATGCTCCTCCCATCAAAGGGCAAATTAAATGTTCATCAAATATTACAGGGTTATTATTAACAAGAGATGGTGGTGTCCGCGAGGACAACGCCCCTGAGATCTTTAGACCTGGAGGAGGAGATATGAGGGATAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTGGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAAAGAGGAAAAAGAGCAGTAACGCTGGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGGCAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACTTACAGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTACCTTGGAATACTAGTTGGAGTAATAAATCTTTGGAAAAGATTTGGAAAAACATGACCTGGATGGAGTGGGAGAAAGAAATTAACAATTACACAAGGACAATATACACCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAGGAATTATTGGAATTGGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATCATGATAGTAGGAGGTATAGTAGGGTTAAGAATAGTTTTTACTGTGCTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTGTCATTCCAGACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGAACGGATTCTTTGCGCTTATCTGGGACGACCTGCAGAGCCTGTGCCTCTTCAGCTACCGCCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAAGAGTGCTGTTAGTTTGCTTAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAATTGGTAGAGCTATTCTCCACATCCCTAGAAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +OQ092467,tat_exon2,8388,8484,8376,8469,forward,0.886666666666666,RPASQLRGDQTGPKEQKKKVERETETDPGN,RPASQLRGDQTGPKEQKKKVERETETDPGN**,AGACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGA +OQ092467,rev_exon2,8389,8674,8377,8653,forward,0.38351648351648326,DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC,DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC*,GACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGAACGGATTCTTTGCGCTTATCTGGGACGACCTGCAGAGCCTGTGCCTCTTCAGCTACCGCCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAAGAGTGCTGTTAG +OQ092467,nef,8808,9417,8796,9417,forward,0.6048780487804808,MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC,MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC*,ATGGGTGGCAAGTGGTCAAAATGTAGTCTGGTTGGATGGCCTGCTATAAGGGAAAGAATGAGACGAGCTGAGCCAGCTCCAGCAGCAGAAGGGGTGGGAGCAGCATCTCGAGACTTGGAAAAACATGGAGCACTCACAACTAGTAATACAGCAGCTAATAATGCTGCTTGTGCCTGGCTGGAAGCACAAGAGGAGGAAGAGGTGGGGTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGGAGCTATGGATCTTGGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCCAAAAAGACAAGAAATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTATACACCAGGGCCAGGGACTAGATATCCATTAACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATGAAGGAGAGAATAGCTGTTTGCTACACCCGATGAACCAGCATGGGGCAGATGACACAGAAAGAGAAGTATTAATGTGGAAGTTTGACAGCAGCCTAGCATTTCATCACAAGGCCCGAGAGCTGCATCCGGAGTACTACAAAAACTGCTGA diff --git a/tests/expected-results-large/orfs.json b/tests/expected-results-large/orfs.json index 3e1686b..661921e 100644 --- a/tests/expected-results-large/orfs.json +++ b/tests/expected-results-large/orfs.json @@ -2,9 +2,11 @@ "KX505501.1": [ { "name": "env", - "orientation": "forward", "start": 0, "end": 1824, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 1.9898364485981306, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", "aminoacids": "GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*", @@ -12,9 +14,11 @@ }, { "name": "gag", - "orientation": "forward", "start": 336, "end": 1824, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.3622000000000025, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", "aminoacids": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*", @@ -22,9 +26,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 1306, "end": 1927, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 2.1463541666666663, "protein": "MRTQIVKLF", "aminoacids": "MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*", @@ -32,9 +38,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 1306, "end": 1927, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 2.1430894308943085, "protein": "MRTQIVKLF", "aminoacids": "MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*", @@ -42,9 +50,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1628, "end": 1748, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 2.1349950149551358, "protein": "FCRENLAFPQGKAGEFPSEQTRANSPTSRELQVWGRDTN", "aminoacids": "FCRENLAFPQGKAGEFPSEQTRANSPTSRELQVWGRDTN*", @@ -52,9 +62,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 1746, "end": 1824, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 2.12, "protein": "RCIRSTTRTADTELFTRDFPLGTFQ", "aminoacids": "RCIRSTTRTADTELFTRDFPLGTFQ*", @@ -62,9 +74,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 1747, "end": 1927, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 2.098780487804878, "protein": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI", "aminoacids": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*", @@ -72,9 +86,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 1747, "end": 1927, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 1.9802197802197803, "protein": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI", "aminoacids": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*", @@ -82,9 +98,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 1748, "end": 1751, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 2.1884615384615382, "protein": "M", "aminoacids": "M", @@ -92,9 +110,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 1748, "end": 1751, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 2.1875, "protein": "M", "aminoacids": "M", @@ -102,9 +122,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 1748, "end": 1751, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 2.1653846153846152, "protein": "M", "aminoacids": "M", @@ -114,9 +136,11 @@ "MN691959": [ { "name": "gag", - "orientation": "forward", "start": 639, "end": 2142, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.05400000000000005, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ", "aminoacids": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ*", @@ -124,9 +148,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1934, "end": 4946, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.03589232303090717, "protein": "FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -134,9 +160,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4890, "end": 5469, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.0625, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*", @@ -144,9 +172,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5408, "end": 5702, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.21153846153845945, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS", "aminoacids": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*T", @@ -154,9 +184,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5679, "end": 5895, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ", @@ -164,9 +196,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5818, "end": 5896, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEDLLKTVRLIKFLYQSS", "aminoacids": "MAGRSGDSDEDLLKTVRLIKFLYQSS", @@ -174,9 +208,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5910, "end": 6156, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.7060975609756097, "protein": "SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL", "aminoacids": "MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL*", @@ -184,9 +220,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6070, "end": 8683, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.0867990654205606, "protein": "MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL", "aminoacids": "MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*DGWQVVKK*", @@ -194,9 +232,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8237, "end": 8333, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.19999999999999996, "protein": "RPTSQTRGDPTGPKE", "aminoacids": "RPTSQTRGDPTGPKE*KKKVERETETDPFD**", @@ -204,9 +244,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8238, "end": 8514, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.16483516483516492, "protein": "DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE", "aminoacids": "DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE*", @@ -214,9 +256,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8657, "end": 9278, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.16991869918698432, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", "aminoacids": "MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*", @@ -226,9 +270,11 @@ "MN692074": [ { "name": "env", - "orientation": "forward", "start": 2, "end": 4115, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 1.9582943925233647, "protein": "MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", "aminoacids": "EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", @@ -236,9 +282,11 @@ }, { "name": "gag", - "orientation": "forward", "start": 789, "end": 2292, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.13880000000000003, "protein": "MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ", "aminoacids": "MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*", @@ -246,9 +294,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2084, "end": 4115, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.7912263210369039, "protein": "FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", "aminoacids": "FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", @@ -256,9 +306,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 3617, "end": 4115, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 1.9968750000000002, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", "aminoacids": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", @@ -266,9 +318,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 3617, "end": 4085, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 1.9602564102564104, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDT", "aminoacids": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDT", @@ -276,9 +330,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 3617, "end": 4115, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 1.965040650406504, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", "aminoacids": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", @@ -286,9 +342,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 3823, "end": 4084, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 2.0305555555555554, "protein": "MVPVRERTHSRSRNLLCRWGS", "aminoacids": "MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY", @@ -296,9 +354,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 3823, "end": 4084, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 2.0153846153846153, "protein": "MVPVRERTHSRSRNLLCRWGS", "aminoacids": "MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY", @@ -306,9 +366,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 4080, "end": 4164, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 2.09390243902439, "protein": "IPSGEPSDAAYKQLLFACTGSLWLDQI", "aminoacids": "IPSGEPSDAAYKQLLFACTGSLWLDQI*", @@ -316,9 +378,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 4080, "end": 4164, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 2.1133333333333333, "protein": "IPSGEPSDAAYKQLLFACTGSLWLDQI", "aminoacids": "IPSGEPSDAAYKQLLFACTGSLWLDQI*", @@ -326,9 +390,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 4080, "end": 4164, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 2.065934065934066, "protein": "IPSGEPSDAAYKQLLFACTGSLWLDQI", "aminoacids": "IPSGEPSDAAYKQLLFACTGSLWLDQI*", @@ -338,9 +404,11 @@ "MN692145": [ { "name": "gag", - "orientation": "forward", "start": 775, "end": 2287, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.15900000000000003, "protein": "MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ", "aminoacids": "MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*R*", @@ -348,9 +416,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2070, "end": 5085, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.10618145563310066, "protein": "FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*", @@ -358,9 +428,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 5029, "end": 5608, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.21875, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*", @@ -368,9 +440,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5547, "end": 5841, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.44358974358974423, "protein": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS", "aminoacids": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*T", @@ -378,9 +452,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5818, "end": 6037, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ", "aminoacids": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*", @@ -388,9 +464,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5957, "end": 6038, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5192307692307692, "protein": "MAGRSGDSDEELLKTVRLIKFLYQSSK", "aminoacids": "MAGRSGDSDEELLKTVRLIKFLYQSSK", @@ -398,9 +476,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6049, "end": 6298, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.5804878048780489, "protein": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL", "aminoacids": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*", @@ -408,9 +488,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6212, "end": 8783, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.4975467289719626, "protein": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL", "aminoacids": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*", @@ -418,9 +500,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8364, "end": 8460, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.4866666666666659, "protein": "RPASQPRGDPTGPKESKKKVERETETDPLH", "aminoacids": "RPASQPRGDPTGPKESKKKVERETETDPLH**", @@ -428,9 +512,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8365, "end": 8641, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.2637362637362637, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE", "aminoacids": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*", @@ -438,9 +524,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8784, "end": 9576, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.3878048780487735, "protein": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC", "aminoacids": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*HRAFYKGLSAGDFPGEAWPGRGRGVASPQMLHISSCFCLYWVSLVRPDLSLGALWLTREPTA*", @@ -450,9 +538,11 @@ "MN090335": [ { "name": "gag", - "orientation": "forward", "start": 315, "end": 1665, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.8911999999999998, "protein": "MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ", "aminoacids": "MYTIEGGYCII**SKFF*SCLKGWL*LFQYLFTAS*CF*QARINCESF*FPACPYYMF*SIFFLSPWP*PNFLPSI*FSPAQY*RSRTHLSPSSLR*SKMAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ*", @@ -460,9 +550,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1427, "end": 4469, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.2169491525423728, "protein": "FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -470,9 +562,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4413, "end": 5001, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.34375, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH*SF*", @@ -480,9 +574,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 4931, "end": 5225, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.5192307692307698, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*T", @@ -490,9 +586,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5202, "end": 5418, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.45833333333333326, "protein": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", "aminoacids": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", @@ -500,9 +598,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5341, "end": 5419, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6923076923076923, "protein": "MAGRSGDRDEDLLKTVRLIKFLYQSS", "aminoacids": "MAGRSGDRDEDLLKTVRLIKFLYQSS", @@ -510,9 +610,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5433, "end": 5682, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6560975609756099, "protein": "MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL", "aminoacids": "MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL*", @@ -520,9 +622,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5596, "end": 8158, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.6022196261682247, "protein": "MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ", "aminoacids": "MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*", @@ -530,9 +634,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7739, "end": 7835, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.3999999999999999, "protein": "RPSSQPRGDQTGPKE", "aminoacids": "RPSSQPRGDQTGPKE*KKKVERETEADPED**", @@ -540,9 +646,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7740, "end": 8016, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.46153846153846145, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE", "aminoacids": "DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE*", @@ -550,9 +658,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8159, "end": 8819, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.5260162601625942, "protein": "MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC", "aminoacids": "MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*H*", @@ -562,9 +672,11 @@ "MN090376": [ { "name": "gag", - "orientation": "forward", "start": 376, "end": 1639, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 2.1734000000000018, "protein": "MQTQIVRPF", "aminoacids": "MFCTIG*FWLTWLLFPGSAAACCVFFLLLFCSSSILSKASLVSFISIL*CTQ*RTATVLNNDLSSSDPV*SAGCSCPSICLQPSDVSNRPGLTANRSSSLLAHTICFNLYLFFPPGLNRIFSHLSNSPPLNTDALAPISLLLASASQKGVLTVRRPSPLAVRASASRVR*FWD*IK**ECIVLPAFWT*DKDQRNPLETM*IGSIKL*EPSKLHRR*KIG*QKPCWSRMQTQIVRPF*KHWVQQLH*KK**QHAREWEDPAIRQEFWRKQ*AK*QTQLP**CRKAILGAKERWLSVSIVAKKGT*PEIAGPLGKGAVGNVERKDTK*KIVLRDRQIF*GKSGLPTRGGQGTFLKAEQNQQPHQRRASVLGRRQQLLLRSRSR*TRNYTLCLPSNHSLATTLSHSKDRGATKGSSIRYRSR*", @@ -572,9 +684,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1382, "end": 4394, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.18823529411764706, "protein": "FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED", "aminoacids": "FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED*", @@ -582,9 +696,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4338, "end": 4929, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.41770833333333335, "protein": "MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH", "aminoacids": "MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH*NF*", @@ -592,9 +708,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 4859, "end": 5153, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.44230769230769296, "protein": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*T", @@ -602,9 +720,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5130, "end": 5346, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5833333333333333, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ", @@ -612,9 +732,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5269, "end": 5347, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.723076923076923, "protein": "MAGRSGDSDEELLRIAGTIKFLYQSS", "aminoacids": "MAGRSGDSDEELLRIAGTIKFLYQSS", @@ -622,9 +744,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5361, "end": 5631, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.7073170731707319, "protein": "MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL", "aminoacids": "MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL*", @@ -632,9 +756,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5524, "end": 8137, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.5484813084112157, "protein": "MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL", "aminoacids": "MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*NGRHILKT*", @@ -642,9 +768,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7691, "end": 7784, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.4866666666666659, "protein": "RPSSQPRGDPTGPKESEKKVERETETDPVT", "aminoacids": "RPSSQPRGDPTGPKESEKKVERETETDPVT*", @@ -652,9 +780,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7692, "end": 7968, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.46153846153846145, "protein": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE", "aminoacids": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE*", @@ -662,9 +792,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8111, "end": 8735, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6943089430894234, "protein": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC", "aminoacids": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC*", @@ -674,9 +806,11 @@ "MK115581.1": [ { "name": "gag", - "orientation": "forward", "start": 680, "end": 2186, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -684,9 +818,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1972, "end": 4984, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14755732801595212, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -694,9 +830,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4928, "end": 5507, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.35416666666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -704,9 +842,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5446, "end": 5740, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -714,9 +854,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5717, "end": 5936, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", @@ -724,9 +866,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5856, "end": 5934, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", @@ -734,9 +878,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5948, "end": 6194, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6865853658536587, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -744,9 +890,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6111, "end": 8652, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.49135514018691584, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -754,9 +902,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8233, "end": 8329, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -764,9 +914,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8234, "end": 8519, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.39560439560439553, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -774,9 +926,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8653, "end": 9274, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -786,9 +940,11 @@ "MK115690.1": [ { "name": "gag", - "orientation": "forward", "start": 777, "end": 2292, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.1894, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ", "aminoacids": "MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ*R*", @@ -796,9 +952,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2078, "end": 5090, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.13958125623130613, "protein": "FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -806,9 +964,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 5034, "end": 5622, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.40104166666666674, "protein": "MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH*SF*", @@ -816,9 +976,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5552, "end": 5846, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.5576923076923082, "protein": "MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS", "aminoacids": "MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS*S", @@ -826,9 +988,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5823, "end": 6039, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.45833333333333326, "protein": "MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ", "aminoacids": "MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ", @@ -836,9 +1000,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5962, "end": 6040, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6923076923076923, "protein": "MAGRSGDNDEDLLKTVRFIKLLYQSS", "aminoacids": "MAGRSGDNDEDLLKTVRFIKLLYQSS", @@ -846,9 +1012,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6054, "end": 6300, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.552439024390244, "protein": "MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL", "aminoacids": "MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL*", @@ -856,9 +1024,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6217, "end": 8800, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.5558411214953274, "protein": "MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ", "aminoacids": "MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ*", @@ -866,9 +1036,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8381, "end": 8489, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKEPETKVESKTETDPLT", "aminoacids": "RPTSQPRGDPTGPKEPETKVESKTETDPLT*WMDS*", @@ -876,9 +1048,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8382, "end": 8658, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.4505494505494505, "protein": "DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE*", @@ -886,9 +1060,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8801, "end": 9425, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6089430894308867, "protein": "MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN", "aminoacids": "MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN*NC*", @@ -898,9 +1074,11 @@ "MK115571.1": [ { "name": "gag", - "orientation": "forward", "start": 579, "end": 2079, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*", @@ -908,9 +1086,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1871, "end": 4883, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14755732801595212, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -918,9 +1098,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4827, "end": 5406, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.36979166666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -928,9 +1110,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5345, "end": 5639, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -938,9 +1122,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5616, "end": 5832, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -948,9 +1134,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5755, "end": 5833, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", @@ -958,9 +1146,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5847, "end": 6093, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6500000000000001, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -968,9 +1158,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6010, "end": 8551, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.49065420560747675, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -978,9 +1170,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8132, "end": 8228, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -988,9 +1182,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8133, "end": 8418, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.4285714285714286, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -998,9 +1194,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8552, "end": 9173, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -1010,9 +1208,11 @@ "MK115514.1": [ { "name": "gag", - "orientation": "forward", "start": 584, "end": 2090, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -1020,9 +1220,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1876, "end": 4888, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14456630109670976, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -1030,9 +1232,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4832, "end": 5411, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.36979166666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -1040,9 +1244,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5350, "end": 5644, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -1050,9 +1256,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5621, "end": 5840, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", @@ -1060,9 +1268,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5760, "end": 5838, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", @@ -1070,9 +1280,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5852, "end": 6098, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6500000000000001, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -1080,9 +1292,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6015, "end": 8556, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.4941588785046729, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -1090,9 +1304,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8137, "end": 8233, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -1100,9 +1316,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8138, "end": 8423, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.4285714285714286, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -1110,9 +1328,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8557, "end": 9178, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -1122,9 +1342,11 @@ "MK115488.1": [ { "name": "gag", - "orientation": "forward", "start": 707, "end": 2213, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -1132,9 +1354,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1999, "end": 5011, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14456630109670976, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -1142,9 +1366,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4955, "end": 5534, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.36979166666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -1152,9 +1378,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5473, "end": 5767, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -1162,9 +1390,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5744, "end": 5963, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", @@ -1172,9 +1402,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5883, "end": 5961, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", @@ -1182,9 +1414,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5975, "end": 6221, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6500000000000001, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -1192,9 +1426,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6138, "end": 8679, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.4941588785046729, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -1202,9 +1438,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8260, "end": 8356, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -1212,9 +1450,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8261, "end": 8546, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.4285714285714286, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -1222,9 +1462,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8680, "end": 9301, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -1234,9 +1476,11 @@ "MK115030.1": [ { "name": "gag", - "orientation": "forward", "start": 176, "end": 1685, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.22580000000000022, "protein": "MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP", "aminoacids": "MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*", @@ -1244,9 +1488,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1477, "end": 4567, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.21934197407776668, "protein": "FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED", "aminoacids": "FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*NMEQFSKTPYAYFKESSEMGLQTSL*", @@ -1254,9 +1500,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4433, "end": 5012, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.38020833333333326, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*", @@ -1264,9 +1512,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 4951, "end": 5245, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.5192307692307698, "protein": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", "aminoacids": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*L", @@ -1274,9 +1524,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5222, "end": 5441, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5972222222222223, "protein": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", "aminoacids": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*", @@ -1284,9 +1536,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5361, "end": 5439, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6538461538461537, "protein": "MAGRSGDSDEELLTAVRIIKRLYQSS", "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSS", @@ -1294,9 +1548,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5453, "end": 5699, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.780487804878049, "protein": "MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM", "aminoacids": "MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM*", @@ -1304,9 +1560,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5616, "end": 8217, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.5768691588785053, "protein": "MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL", "aminoacids": "MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*", @@ -1314,9 +1572,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7798, "end": 7891, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.4866666666666659, "protein": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD", "aminoacids": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD*", @@ -1324,9 +1584,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7799, "end": 8075, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.4285714285714286, "protein": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE", "aminoacids": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*", @@ -1334,9 +1596,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8218, "end": 8866, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.7959349593495859, "protein": "MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC", "aminoacids": "MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*H*", @@ -1346,9 +1610,11 @@ "MK115498.1": [ { "name": "gag", - "orientation": "forward", "start": 663, "end": 2169, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -1356,9 +1622,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1955, "end": 4967, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14755732801595212, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -1366,9 +1634,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4911, "end": 5490, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.35416666666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -1376,9 +1646,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5429, "end": 5723, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -1386,9 +1658,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5700, "end": 5916, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -1396,9 +1670,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5839, "end": 5917, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", @@ -1406,9 +1682,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5931, "end": 6177, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6865853658536587, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -1416,9 +1694,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6094, "end": 8635, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.49135514018691584, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -1426,9 +1706,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8216, "end": 8312, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -1436,9 +1718,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8217, "end": 8502, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.39560439560439553, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -1446,9 +1730,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8636, "end": 9257, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -1458,9 +1744,11 @@ "MK115211.1": [ { "name": "gag", - "orientation": "forward", "start": 250, "end": 1753, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.1938000000000002, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP", "aminoacids": "MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP*SQ*", @@ -1468,9 +1756,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1545, "end": 4557, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.20219341974077754, "protein": "FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED", "aminoacids": "FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED*", @@ -1478,9 +1768,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4501, "end": 5083, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.39687499999999987, "protein": "MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH", "aminoacids": "MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH*", @@ -1488,9 +1780,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5022, "end": 5316, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4807692307692313, "protein": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*T", @@ -1498,9 +1792,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5293, "end": 5512, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5694444444444444, "protein": "MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ*", @@ -1508,9 +1804,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5432, "end": 5513, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.7115384615384615, "protein": "MAGRSGDSDEELLRITRTIKFLYQNSE", "aminoacids": "MAGRSGDSDEELLRITRTIKFLYQNSE", @@ -1518,9 +1816,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5524, "end": 5794, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.7439024390243905, "protein": "MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL", "aminoacids": "MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL*", @@ -1528,9 +1828,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5687, "end": 8198, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 1.2061915887850478, "protein": "MHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL", "aminoacids": "MRVKGTKKNWQPSWRWGTMLIWGWATMLLGRSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDPEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTTINNTSSIEEGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSATITQACPKVSFEPIPIH*VQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRKAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*", @@ -1538,9 +1840,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7779, "end": 7872, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.4866666666666659, "protein": "RPSSQPRGDPTGPKESEKKVERETETDPVT", "aminoacids": "RPSSQPRGDPTGPKESEKKVERETETDPVT*", @@ -1548,9 +1852,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7780, "end": 8056, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.46153846153846145, "protein": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE", "aminoacids": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE*", @@ -1558,9 +1864,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8199, "end": 8838, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6943089430894234, "protein": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC", "aminoacids": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC*QRAF*", @@ -1570,9 +1878,11 @@ "MK115158.1": [ { "name": "gag", - "orientation": "forward", "start": 316, "end": 1819, + "subtype_start": 234, + "subtype_end": 1731, + "orientation": "forward", "distance": 0.3517171717171721, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP", "aminoacids": "MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP*SQ*", @@ -1580,9 +1890,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1611, "end": 4623, + "subtype_start": 1526, + "subtype_end": 4535, + "orientation": "forward", "distance": 0.26447105788423153, "protein": "FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED", "aminoacids": "FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED*", @@ -1590,9 +1902,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4567, "end": 5149, + "subtype_start": 4479, + "subtype_end": 5061, + "orientation": "forward", "distance": 0.5668393782383419, "protein": "MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH", "aminoacids": "MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH*", @@ -1600,9 +1914,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5088, "end": 5379, + "subtype_start": 5000, + "subtype_end": 5291, + "orientation": "forward", "distance": 0.46875, "protein": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*", @@ -1610,9 +1926,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5359, "end": 5578, + "subtype_start": 5271, + "subtype_end": 5486, + "orientation": "forward", "distance": 0.5416666666666667, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ*", @@ -1620,9 +1938,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5498, "end": 5579, + "subtype_start": 5410, + "subtype_end": 5486, + "orientation": "forward", "distance": 0.75, "protein": "MAGRSGDSDEELLKITRTIKFLYQNSE", "aminoacids": "MAGRSGDSDEELLKITRTIKFLYQNSE", @@ -1630,9 +1950,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5590, "end": 5860, + "subtype_start": 5502, + "subtype_end": 5748, + "orientation": "forward", "distance": 0.5308641975308646, "protein": "MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWDVNDL", "aminoacids": "MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWDVNDL*", @@ -1640,9 +1962,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5753, "end": 8342, + "subtype_start": 5665, + "subtype_end": 8212, + "orientation": "forward", "distance": 0.5740566037735857, "protein": "MRVKGTKKNWQPSWRWGTMLIWGWATMLLGMSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCENVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL", "aminoacids": "MRVKGTKKNWQPSWRWGTMLIWGWATMLLGMSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCENVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*NGRHILKT*", @@ -1650,9 +1974,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7896, "end": 7992, + "subtype_start": 7793, + "subtype_end": 7886, + "orientation": "forward", "distance": 0.6935483870967742, "protein": "RPSSQPRGDPTGPKESEKKVERETETDPVT", "aminoacids": "RPSSQPRGDPTGPKESEKKVERETETDPVT*R", @@ -1660,9 +1986,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7897, "end": 8173, + "subtype_start": 7794, + "subtype_end": 8070, + "orientation": "forward", "distance": 0.5274725274725274, "protein": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGSGTSGTQGVGSPQVLVESPAVLEPGTKE", "aminoacids": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGSGTSGTQGVGSPQVLVESPAVLEPGTKE*", @@ -1670,9 +1998,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8316, "end": 8994, + "subtype_start": 8213, + "subtype_end": 8834, + "orientation": "forward", "distance": 0.6674757281553398, "protein": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC", "aminoacids": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC*QRAFYKGLSARDFPGEA*", @@ -1682,9 +2012,11 @@ "MK114705.1": [ { "name": "gag", - "orientation": "forward", "start": 532, "end": 2053, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.21479999999999988, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ", "aminoacids": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ*R*", @@ -1692,9 +2024,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1839, "end": 4851, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.17248255234297116, "protein": "FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -1702,9 +2036,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4795, "end": 5383, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.34375, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH*NF*", @@ -1712,9 +2048,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5313, "end": 5601, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.46153846153846234, "protein": "MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS", "aminoacids": "MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS*T", @@ -1722,9 +2060,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5578, "end": 5797, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6222222222222225, "protein": "MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ*", @@ -1732,9 +2072,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5717, "end": 5798, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.8653846153846154, "protein": "MAGRSGDRDEDLLETVRFIKFLYQNSK", "aminoacids": "MAGRSGDRDEDLLETVRFIKFLYQNSK", @@ -1742,9 +2084,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5809, "end": 6055, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.7963414634146342, "protein": "MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL", "aminoacids": "MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL*", @@ -1752,9 +2096,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5972, "end": 8549, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.5660046728971964, "protein": "MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL", "aminoacids": "MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL*", @@ -1762,9 +2108,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8130, "end": 8226, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.9733333333333327, "protein": "RPPAQPQGDPTGPKKSKKEVEKETETDQCD", "aminoacids": "RPPAQPQGDPTGPKKSKKEVEKETETDQCD**", @@ -1772,9 +2120,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8131, "end": 8407, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.5494505494505495, "protein": "DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE", "aminoacids": "DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE*", @@ -1782,9 +2132,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8550, "end": 9138, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.4593495934959331, "protein": "MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK", "aminoacids": "MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK*CVPVCCVTLVTRDPSDHFSQRGKSLAVAPEQGPESESRTRGDLSTQDSAC*", @@ -1794,9 +2146,11 @@ "MK114856.1": [ { "name": "gag", - "orientation": "forward", "start": 120, "end": 2022, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 1.871000000000001, "protein": "MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC", "aminoacids": "MLHISSCFLPVLGLSGWTRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSGSNLVQPERPSSSGARTGT*KRK*NQRRSLDAGLGLLKRARQEAKGGDW*VRHF*LAEARRRKIGARASVLSRGELDR*EKIQLRPRRKKKYRLKHIV*ASKELERFAVNPGLLETSGGCKQILEQLQPSLQTRSEELRSLYNTVATLYYVHQKIDVKDTKEALDKVEEEQNKSKKKAQQAAADTRNRGQTSQNFPIVQNLQGQIVHQAISPRTLNA*VKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVSRHQAAMQMLKKVINEEAAE*DRLHPVHARPIAPGQIREPKRSDIARTTSTLQEQIR*MTHNPPIPVRKIYKR*IILGLNKIVKMYSPTSILDIKQRPKEPFRDYVDQFYKTLRAKQATQKVKN*MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC*KYRKERHQMKNCTKRQANFLKKIWPSHKGRPENFPQSRPEIPQSRPEPTAPPAPPEKSFKFEEATTPSQKQETIDKELYPLTSLRSLFGNDPSSQ*", @@ -1804,9 +2158,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1787, "end": 4892, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 2.003988035892324, "protein": "ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI", "aminoacids": "FFKENLAFPQRKARELSSKPTRNSSEQTRANSPTSPSRKELQV*RSNNSLSEAGDNRQGAVSSNFPQITLWQRPIVTIKIREQLKKALLNTGADDTVLEDIDLPRK*KPKMIRRIRSFIKVRQYEQVPIEISRHKAISTVLVGPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPRMDGPKVKQ*PLTEEKIKALVEICTEIEKEKKISKIRPENPYNTPVFAIKKKDGTK*KKLVDFRELNKKTQDF*EIQLSIPHPAKLKKKKSVTVLDVGDAYFSVPLDKDFKKYTAFTIPSINNETPKIRYQYNVLPQR*KRSPAIFQSSMTKILEPFRKTNPDIVIYQYIDDLYVRSDLEIRQHRTKVKELRQHLMR*RFTTPDKKHQKEPPFL*MRYELHPDKWTVQPIVLPEKES*TVNDIQKLVRKLN*ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI*RRTPKFRLPIQKET*ET*WTDYWQAT*IPK*EFVNTPPLVKL*YQLEKEPIIRAETFYVDKAANKDNKSRKARYVTDRRRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKKKVYLA*VPAHKRIKRNEQVNKLVSARIKKVLFLDKIEKAQEDHKKYHSN*RTMASNFNLPPIVAKEIVASCDKCQLKKEAMHRQVDCSPGIWQLDCTHLEEKIILVAVHVASRYIEAEVIPAETRQETAYFILKLARRWPVKTIHTDNGRNFTSNTVKAAC**AKIKQEFSIPYNPQSQEVVKSINNELKKIIRQVKDQAKHLKTAVQMAVFIHNFKRKGGIEGYSAEERIVDIIATEIQTKELQKQITKIQNFQVYYKDSRDPL*KGPAKLLWKGEKAVVIQDNSDIKVVPRRKAKIIKDYKKQMASDDCVASRQDED*NMEKFSKIPYVYFKESQEIGL*", @@ -1814,9 +2170,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4791, "end": 5349, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 1.928125, "protein": "MIVWQVDRMKIRTWKSLVKYHMYISKKAKK", "aminoacids": "MIVWQVDRMKIRTWKSLVKYHMYISKKAKK*AYRHHYETTHPRISSEVHIPLGGARLVITTY*GLHTGEKDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVRSLQYLALTALITPKKIKPPLPSVKKLTEDR*NKPQKTKGHRKSHTMNRH*", @@ -1824,9 +2182,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5033, "end": 5582, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 2.052564102564103, "protein": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS", "aminoacids": "MEKKEI*HTSRP*LSRPSNSCALF*LFFRICYKKCHIRT*S*P*V*ISSRT*QSKISTILGTNSINNTKEDKATFA*CKETDRR*IEQAPEDQRPQKEPYNE*TLELLEELKREAVRHFPRPWLQNLRQYIYETYKDTWTRVEAIIRILQQMLFIHFRIKCHHSRIGIVLQRRARNRASRS*T", @@ -1834,9 +2194,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5427, "end": 5775, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 2.1097222222222225, "protein": "MKLIKILGQE", "aminoacids": "MKLIKILGQE*KP**EFCNKCCLFISELSVTIAE*ALFCKEEQEIEPVDHRLEP*KHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", @@ -1844,9 +2206,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5698, "end": 5776, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6923076923076923, "protein": "MAGRSGDRDEDLLKTVRLIKFLYQSS", "aminoacids": "MAGRSGDRDEDLLKTVRLIKFLYQSS", @@ -1854,9 +2218,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5790, "end": 6039, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 1.3926829268292686, "protein": "TIVGIKYKKILRQRKIDRIINRIRKRAEDSGNESEKDQEELSALVVEIRHDAP", "aminoacids": "MQPLKILAIVALVVAAIIAIVV*TIVGIKYKKILRQRKIDRIINRIRKRAEDSGNESEKDQEELSALVVEIRHDAP*DVDDL*", @@ -1864,9 +2230,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5953, "end": 8557, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 1.8896028037383144, "protein": "MTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD", "aminoacids": "MRAKKIRKNCQHL**K*GTMLLKMLMICSAAENL*VTVYYEVPV*RDANTTLFCASDAKAYDTEVHNV*ATHACVPTDPNPHEVELKNVTENFNM*KNNMVDQMHEDIINL*DQSLKPCAKLTPLCVTLNCTDLKNNTVGNQTNYHLNETNTIQRKEMTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD*SDTLSKIVEKLKEKFRKNKTIIFKQSSREDIEIETHSFNCREEFFYCNTTRLFNST*SVNRTSINRTNNKNITLPCRIKQIINRWQEVRKAMYAPPISKIIRCSSNITGLILTRDSSTTNSKEETFRPRERNMKDN*RSELYKYKVVKIEPLKVAPTKAQRKVVQREKRAIRTLGAMFLRFLRTAGSTIGAASLTLTVQARQLLSGIVQQQNNLLKAIEAQQHMLQLTV*GIKQLQARVLSVERYLQDQQLLKI*SCSRKLICTTTVP*NTS*SNKSYSTI*DNMT*MQ*DREIQNYTKIIYNLLKESQIQQKKNEKELLELDQ*ANL*N*FSITKWL*YIKIFIMIVGGLVSLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRRPDRPERIEEEGEKRDRGRSRRLVTRFLPLI*DDLQSLCLFSYHHLKDLLLIVLKTVQILGHKK*EILKY**SLLQY*IQELKNSAVSLLNTIAIAVAERTDKVIEVRQKISRAFLHIPRKIRQGLEKALQ*NKWQVVKKLYG*", @@ -1874,9 +2242,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8102, "end": 8198, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.8, "protein": "RPSSQPQEDQTGPKE", "aminoacids": "RPSSQPQEDQTGPKE*KKKVKRETEADPED**", @@ -1884,9 +2254,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8103, "end": 8379, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 1.3725274725274725, "protein": "ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE", "aminoacids": "DPPPNPKKTRQARKNRRRR*KERQRQIQKISD*ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE*", @@ -1894,9 +2266,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8549, "end": 9176, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 2.0414634146341464, "protein": "MSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC", "aminoacids": "MAR*PAVKERIERVNPRPAAKKEQAEPAAAKVRAASRDLEKYRAITSSNTSTTNAACA*LEAQEEEEVGFPVRPQVPLRPMTYKAALNLSHFLKEKGGLEGLI*SQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRNPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*", @@ -1906,9 +2280,11 @@ "MK115009.1": [ { "name": "gag", - "orientation": "forward", "start": 302, "end": 1715, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 1.8444000000000005, "protein": "MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC", "aminoacids": "MGARASVLSGGKLDR*EKIYLRPEGKKKYRLKHIV*ASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQIVHQPLSPRTLNA*VKVIEEKAFSPEVIPMFSALSERATPQDLNTMLNTVRGHQAAMQMLKETINDEAAE*DRLHPVHAGPIAPGQMKEPRGSDIAGTTSTLQEQIR*MTHNPPIPVGEIYKRWIILRLNKIVRMYSPVSILDIRQRPKEPFKDYVDRFYKTLKAEQASQDVKN*MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC*KCRKERHQMKDCTKRPD*DG*FFKEDLAFPQGKAREFSPEQTRANSPASRELQV*", @@ -1916,9 +2292,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1613, "end": 4703, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 1.89531405782652, "protein": "AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED", "aminoacids": "FFKEDLAFPQGKAREFSPEQTRANSPASRELQV*GRGNSSSSEAGDERPRTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEINLPGK*KPKMIKRIRSFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKSGIDSPRVKQWPLTEEKIKALIEICAEIEKEKKITKIRPENPYNTPVFAIKKKDSTK*KKLVDFRELNKRTQDF*EVQLRIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPEVKYQYNVLPQR*KRSPAIFQSSMTKILEPFRKENPDIVIYQYIDDLYVRSDLEIEQHRTKIEELRQHLLR*GLTTPDKKHQKKPPFL*ISYELHPDK*TVQPIQLPDKDS*TVNDIQKLVRKLN*ASQIYPEIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQRRDQ*TYQIYQEPFKNLKTEKYARTRGAHTNDVKQLTEAVQKIALEAIVI*RKTPKFKLPIQKET*KMWWTKYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVRAETFYVNKAANRKTKLRKAEYVTDRRRQKVVSLIDTTNQRTKLHAIHLALQDSGSTVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKEKIYLA*VPAHKRIEGNEQVDKLVSNRIRRVLFLDRIDKAQEEHEKYHSN*RAMASNFNLPPVVAKEIVASCDKCQLKGEPMHRQVDCSPGIWQLDCTHLERKIILVAVHVASRYIEAEVIAAETGQETAYFILKLAGR*PVKIIHTDNGSNFTSTTVKAAC**AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED*NIEQFSKTPYAYFKESSEIGLQTSL*", @@ -1926,9 +2304,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4590, "end": 5148, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 2.064583333333333, "protein": "MIVWQVDRMRIRT", "aminoacids": "MIVWQVDRMRIRT*NSLVKHHMHISKKAQR*VYRHHYESHNPKTSSEVHIPLEEARLVIKTY*GLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKRSHTINGH*", @@ -1936,9 +2316,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5087, "end": 5381, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 1.0679487179487188, "protein": "MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT", "aminoacids": "MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT*AEVEAIIRTLQQLLFIHFRIRCQHSRIGIIRQRRARNRASRS*L", @@ -1946,9 +2328,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5412, "end": 5574, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 1.0958333333333334, "protein": "MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ", "aminoacids": "MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ", @@ -1956,9 +2340,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5497, "end": 5575, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.7692307692307692, "protein": "MAGRSRDSDEELLTAVRIIKRLYQSS", "aminoacids": "MAGRSRDSDEELLTAVRIIKRLYQSS", @@ -1966,9 +2352,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5589, "end": 5835, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.9975609756097563, "protein": "MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP", "aminoacids": "MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP*DSNDM*", @@ -1976,9 +2364,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5752, "end": 8353, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 1.878154205607472, "protein": "MKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD", "aminoacids": "MRVTRTKRNYPHLWR*GILFLKIVMICSANNL*VTVYYKVPV*KEATTTLFCASDAKAYETEKHNV*ATHACVPTDPSPQEVALENVTETFNM*KNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDNLNLTCPNNNTCSNNTNYNMKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD*NDTLKQIVIKLKEKFKNKTIVFTQSSGEDPEIVMHSFNCREEFFYCNTTQLFNST*NNST*NSTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQRQIRCSSNITGLLLVRDGRSNNSSNDTETFRPRGRDMKDN*RSKLYKYKVVKIKPLRIAPTHAKRRVVQKEKRAIRLEAFFLRFLRAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQAKVLALERYLKDQQLLRI*SCSGKLICTTNVPWNISWSPRWNRSLDKI*TNMT*KQ*EKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQ*L*YIKIFIIIVRGLISLRIVFTILSIVNKVRQGYSPLSLQTLLPTQRGPDRPERTEERGRKKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLKDLLLIAARIVELLGRRK*EALKY**NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL*", @@ -1986,9 +2376,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7934, "end": 8027, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.6866666666666661, "protein": "RPSSQPREDPTGPKEQKKEVERKTEAHPRD", "aminoacids": "RPSSQPREDPTGPKEQKKEVERKTEAHPRD*", @@ -1996,9 +2388,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7935, "end": 8211, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 1.3065934065934066, "protein": "ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE", "aminoacids": "DPPPNPERTRQARKNRRKR*KERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE*", @@ -2006,9 +2400,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8609, "end": 8996, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 1.6390243902439028, "protein": "MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR", "aminoacids": "MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR*CFKLVPVDPDKVEEASVRENNCLLSPENLHRMEDEHREVLQWRFDSRLAFHHIARELHPEYYKDC*", @@ -2018,9 +2414,11 @@ "MK115387.1": [ { "name": "gag", - "orientation": "forward", "start": 292, "end": 1795, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.20799999999999996, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ", "aminoacids": "MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ*", @@ -2028,9 +2426,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1587, "end": 4599, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.13160518444665992, "protein": "FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -2038,9 +2438,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4543, "end": 5122, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.3041666666666665, "protein": "MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH*", @@ -2048,9 +2450,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5061, "end": 5355, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*I", @@ -2058,9 +2462,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5332, "end": 5551, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.41666666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ*", @@ -2068,9 +2474,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5471, "end": 5552, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6346153846153846, "protein": "MAGRSGDSDEDLLKTVRLIKYLYQSSE", "aminoacids": "MAGRSGDSDEDLLKTVRLIKYLYQSSE", @@ -2078,9 +2486,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5563, "end": 5809, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.7682926829268295, "protein": "MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL", "aminoacids": "MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL*", @@ -2088,9 +2498,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5726, "end": 8288, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.6280373831775696, "protein": "MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL", "aminoacids": "MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL*", @@ -2098,9 +2510,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7869, "end": 7965, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.6000000000000001, "protein": "RPSSQLRGEPTGPKE", "aminoacids": "RPSSQLRGEPTGPKE*KKEVERETKADPVD**", @@ -2108,9 +2522,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7870, "end": 8146, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.29670329670329676, "protein": "DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE", "aminoacids": "DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE*", @@ -2118,9 +2534,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8289, "end": 8940, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.5162601626016183, "protein": "MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC", "aminoacids": "MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*", @@ -2130,9 +2548,11 @@ "MK115491.1": [ { "name": "gag", - "orientation": "forward", "start": 521, "end": 2027, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -2140,9 +2560,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1813, "end": 4825, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14755732801595212, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -2150,9 +2572,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4769, "end": 5348, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.35416666666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -2160,9 +2584,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5287, "end": 5581, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -2170,9 +2596,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5558, "end": 5777, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", @@ -2180,9 +2608,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5697, "end": 5775, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", @@ -2190,9 +2620,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5789, "end": 6035, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6865853658536587, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -2200,9 +2632,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5952, "end": 8493, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.49135514018691584, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -2210,9 +2644,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8074, "end": 8170, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -2220,9 +2656,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8075, "end": 8360, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.39560439560439553, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -2230,9 +2668,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8494, "end": 9115, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -2242,9 +2682,11 @@ "MK116110.1": [ { "name": "gag", - "orientation": "forward", "start": 0, "end": 1557, + "subtype_start": 140, + "subtype_end": 1643, + "orientation": "forward", "distance": 2.1186000000000007, "protein": "MVFISCGVAPSANAENIGITSGLKAFSSTTFTHAFKVLGDMA", "aminoacids": "PESESRTREVLSTQDSAC*ALWPGPPTP*HAVIISSSVAAGPNAFKIVLQSGFAFWTNKVSVIQFFTSCEACSALRVL*NRST*SLKGSFGPCFMSKMLTGLYILTILFNPRITHLL*ISPTGIGGLFVIHPICS*RVLVVPAISLPLGSLIWPGATGPACTGCNLSHSAASSLMVSFNICIAA*CPPTVFSMVFISCGVAPSANAENIGITSGLKAFSSTTFTHAFKVLGDMA*CTICPWRFCTIG*FWLTWLLFPAPAAACCAFILLLFCSSSILSSAPLVSCISIL*CIQ*RTATVLYNDLSSSDPVWRDGCSCPSICLQPSDVSNRPGLTANRSSSLLAHTRCFNLYFFFPPGLNRIFSHWSNFPPLNTDALAPISLLLASAR*KLFWRTHQSPKQ*AK*IQLP**CRKAILGTKRRLLSVSTVVK*GI*QKIAGPPGERAVGNVDRKDTR*KIVVRDRLIF*GNSGLPTRGGQGISFRADQSQQPHQRRASGLGKRQQLPLRSRSR*TGNYIP*", @@ -2252,9 +2694,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1393, "end": 4405, + "subtype_start": 1435, + "subtype_end": 4447, + "orientation": "forward", "distance": 0.19680957128614174, "protein": "FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED", "aminoacids": "FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED*", @@ -2262,9 +2706,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4349, "end": 4928, + "subtype_start": 4391, + "subtype_end": 4970, + "orientation": "forward", "distance": 0.546875, "protein": "MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH", "aminoacids": "MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH*", @@ -2272,9 +2718,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 4867, "end": 5158, + "subtype_start": 4909, + "subtype_end": 5200, + "orientation": "forward", "distance": 0.48333333333333317, "protein": "MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPRIWLQSLGQYVYETYGDTWTGVEAIIRILQQMLFIHFRIGCQHSRIGIIRRGRTRNGASRP", "aminoacids": "MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPRIWLQSLGQYVYETYGDTWTGVEAIIRILQQMLFIHFRIGCQHSRIGIIRRGRTRNGASRP*", @@ -2282,9 +2730,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5138, "end": 5357, + "subtype_start": 5180, + "subtype_end": 5395, + "orientation": "forward", "distance": 0.6111111111111112, "protein": "MEPVDPSLAPWKHPGSQPKTACTNCYCKKCCLHCQVCFTKKGLGISYGRKKRRQRRRPPQSSKAHQNPLPKQ", "aminoacids": "MEPVDPSLAPWKHPGSQPKTACTNCYCKKCCLHCQVCFTKKGLGISYGRKKRRQRRRPPQSSKAHQNPLPKQ*", @@ -2292,9 +2742,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5277, "end": 5355, + "subtype_start": 5319, + "subtype_end": 5395, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEDLLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEDLLKAVRLIKILYQSS", @@ -2302,9 +2754,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5369, "end": 5615, + "subtype_start": 5411, + "subtype_end": 5657, + "orientation": "forward", "distance": 0.48124999999999996, "protein": "MQSLQIGAIVALVVGTIIAIVVWSIVLIEYRKILRQKKIDRIIDRIVERAEDSGNESEGDQEELSALVERGHDAPWNVNDL", "aminoacids": "MQSLQIGAIVALVVGTIIAIVVWSIVLIEYRKILRQKKIDRIIDRIVERAEDSGNESEGDQEELSALVERGHDAPWNVNDL*", @@ -2312,9 +2766,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5532, "end": 8073, + "subtype_start": 5574, + "subtype_end": 8124, + "orientation": "forward", "distance": 0.5259128386336873, "protein": "MRVKETRKSYQHWWKGGMMLLGMLMICSAATNLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVLLGNVTEDFNAWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILHCTDVNNTRNGMTGELKNCSFNITTKITNKVQKEYALFYKLDVVPINNKDNDTSFNNNSYRLISCNTSVITQACPKVSFEPIPIHYCTPAGYAILRCNNETFSGKGPCTNVSSIQCTHGIRPVVSTQLLLNGSLAKQEVVIRSQNFSDNVKTIIVQLKTPVKINCTRPNNNTRKSIHAGPGKVIYATGEIIGDIRQAHCNISAAEWNDTLGQIVTKLQEQFGNKTIVFNQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWNNNGTNTWNSTGNITLPCKIRQIVNMWQKVGKAMYAPPIRGQIKCSSNITGLLLTRDGGNESESETFRPGGGDMRDNWRSELYKYKVVRIEPLGLAPTKAKRRVVQREKRAIGTLGAVFLGFLGTAGSTMGAASMTLTVQARQLLSGIVQQQNNLLKAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNASWSNKSLNEIWDNMTWMEWEKEISNYTQLIYTLIEESQSQQEKNEQELLALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEDGGERDRDRSTRLVTGFLPLFWDDLRSLCLFSYHRLRDLLLIAARIVELLGHRGWEILKHWWSLLQYWSQELKKSAVSLLNATAIAVAEGTDRIIEVVQRACRAILHIPVRLRQGLERALL", "aminoacids": "MRVKETRKSYQHWWKGGMMLLGMLMICSAATNLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVLLGNVTEDFNAWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILHCTDVNNTRNGMTGELKNCSFNITTKITNKVQKEYALFYKLDVVPINNKDNDTSFNNNSYRLISCNTSVITQACPKVSFEPIPIHYCTPAGYAILRCNNETFSGKGPCTNVSSIQCTHGIRPVVSTQLLLNGSLAKQEVVIRSQNFSDNVKTIIVQLKTPVKINCTRPNNNTRKSIHAGPGKVIYATGEIIGDIRQAHCNISAAEWNDTLGQIVTKLQEQFGNKTIVFNQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWNNNGTNTWNSTGNITLPCKIRQIVNMWQKVGKAMYAPPIRGQIKCSSNITGLLLTRDGGNESESETFRPGGGDMRDNWRSELYKYKVVRIEPLGLAPTKAKRRVVQREKRAIGTLGAVFLGFLGTAGSTMGAASMTLTVQARQLLSGIVQQQNNLLKAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNASWSNKSLNEIWDNMTWMEWEKEISNYTQLIYTLIEESQSQQEKNEQELLALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEDGGERDRDRSTRLVTGFLPLFWDDLRSLCLFSYHRLRDLLLIAARIVELLGHRGWEILKHWWSLLQYWSQELKKSAVSLLNATAIAVAEGTDRIIEVVQRACRAILHIPVRLRQGLERALL*", @@ -2322,9 +2778,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7654, "end": 7750, + "subtype_start": 7705, + "subtype_end": 7798, + "orientation": "forward", "distance": 0.5, "protein": "RPASQPRGDPTGPKESKKTVERETETDPHA", "aminoacids": "RPASQPRGDPTGPKESKKTVERETETDPHA**", @@ -2332,9 +2790,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7655, "end": 7940, + "subtype_start": 7706, + "subtype_end": 7982, + "orientation": "forward", "distance": 0.48241758241758226, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIHTLSNRILTTFLGRPEEPVPLQLPPLERLTLDCSEDCGTSGTQGVGNPQTLVESPTILESGTKKKCC", "aminoacids": "DPLPSPEGTRQARRNRRRRWRERQRQIHTLSNRILTTFLGRPEEPVPLQLPPLERLTLDCSEDCGTSGTQGVGNPQTLVESPTILESGTKKKCC*", @@ -2342,9 +2802,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8074, "end": 8695, + "subtype_start": 8125, + "subtype_end": 8752, + "orientation": "forward", "distance": 0.4668269230769231, "protein": "MGGKWSKSSVVGWPAVRERIRRAGPAAEGVGAVSRDLDKHGAITSNNTPATNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGMIYSQQRQDILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPLETEQVEAATGGENNCLLHPLNQHGMDDPEREVLMWKFDSSLAFHHRAKELHPEYYKDC", "aminoacids": "MGGKWSKSSVVGWPAVRERIRRAGPAAEGVGAVSRDLDKHGAITSNNTPATNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGMIYSQQRQDILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPLETEQVEAATGGENNCLLHPLNQHGMDDPEREVLMWKFDSSLAFHHRAKELHPEYYKDC*", @@ -2354,9 +2816,11 @@ "MK115527.1": [ { "name": "gag", - "orientation": "forward", "start": 683, "end": 2189, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -2364,9 +2828,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1975, "end": 4987, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14755732801595212, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -2374,9 +2840,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4931, "end": 5510, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.35416666666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -2384,9 +2852,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5449, "end": 5743, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -2394,9 +2864,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5720, "end": 5939, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", @@ -2404,9 +2876,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5859, "end": 5937, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", @@ -2414,9 +2888,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5951, "end": 6197, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6865853658536587, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -2424,9 +2900,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6114, "end": 8655, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.49135514018691584, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -2434,9 +2912,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8236, "end": 8332, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -2444,9 +2924,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8237, "end": 8522, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.39560439560439553, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -2454,9 +2936,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8656, "end": 9277, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -2466,9 +2950,11 @@ "MK114997.1": [ { "name": "gag", - "orientation": "forward", "start": 210, "end": 1725, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.22980000000000023, "protein": "MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP", "aminoacids": "MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP*YQ*E*", @@ -2476,9 +2962,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1511, "end": 4601, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.21934197407776668, "protein": "FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED", "aminoacids": "FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*NMEQFSKTPYAYFKESSEMGLQTSL*", @@ -2486,9 +2974,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4467, "end": 5046, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.38020833333333326, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*", @@ -2496,9 +2986,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 4985, "end": 5279, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.44230769230769296, "protein": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", "aminoacids": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*L", @@ -2506,9 +2998,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5256, "end": 5472, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5694444444444444, "protein": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", "aminoacids": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", @@ -2516,9 +3010,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5395, "end": 5473, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6538461538461537, "protein": "MAGRSGDSDEELLTAVRIIKRLYQSS", "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSS", @@ -2526,9 +3022,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5487, "end": 5733, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.751219512195122, "protein": "MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM", "aminoacids": "MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM*", @@ -2536,9 +3034,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5762, "end": 8216, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 1.2265186915887858, "protein": "MHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL", "aminoacids": "MGYLYGKKQLPLYFVHQMLKHMRQRSIMFGQPMPVYPQTPAHRK*H*KM*QKHLTCGKMTW*SRCMRI*SVYGIKA*SHV*N*PHSVLL*IALIV*VIILIII*RKKEK*KTALSMSPQE*EIG*QKNMHFSIDLM*YQ*MKIVEILRANIG**IVTPQSLHKPVQRYPLSQFPYIFVPRLVLRF*SVEIRNSMEQENVEMSAQYNVHMELGQ*YQLNCC*TAV*QKKR**LDLPISRTMLKP**YS*INL*KLIVQDPTIIQEEVYT*DQGEHFMEQT**GI*DKRIVTLVGKIGMTL*KKIVIKLKEKFENKTIVFNQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*DG*", @@ -2546,9 +3046,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7788, "end": 7881, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.4866666666666659, "protein": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD", "aminoacids": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD*", @@ -2556,9 +3058,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7789, "end": 8065, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.4285714285714286, "protein": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE", "aminoacids": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*", @@ -2566,9 +3070,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8208, "end": 8856, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.7959349593495859, "protein": "MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC", "aminoacids": "MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC*H*", @@ -2578,9 +3084,11 @@ "MK115518.1": [ { "name": "gag", - "orientation": "forward", "start": 739, "end": 2245, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -2588,9 +3096,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2031, "end": 5043, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14755732801595212, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -2598,9 +3108,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4987, "end": 5566, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.35416666666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -2608,9 +3120,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5505, "end": 5799, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -2618,9 +3132,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5776, "end": 5995, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", @@ -2628,9 +3144,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5915, "end": 5996, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6346153846153846, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -2638,9 +3156,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6007, "end": 6253, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6865853658536587, "protein": "MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -2648,9 +3168,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6170, "end": 8711, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.49018691588785046, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -2658,9 +3180,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8292, "end": 8388, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -2668,9 +3192,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8293, "end": 8578, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.39560439560439553, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -2678,9 +3204,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8712, "end": 9333, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -2690,9 +3218,11 @@ "MK115065.1": [ { "name": "gag", - "orientation": "forward", "start": 221, "end": 1736, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.24380000000000024, "protein": "MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP", "aminoacids": "MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*K*", @@ -2700,9 +3230,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1522, "end": 4534, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.20438683948155534, "protein": "FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED", "aminoacids": "FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*", @@ -2710,9 +3242,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4478, "end": 5057, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.38020833333333326, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*", @@ -2720,9 +3254,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 4996, "end": 5290, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4807692307692313, "protein": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", "aminoacids": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*L", @@ -2730,9 +3266,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5267, "end": 5486, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5972222222222223, "protein": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", "aminoacids": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*", @@ -2740,9 +3278,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5406, "end": 5484, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6538461538461537, "protein": "MAGRSGDSDEELLTAVRIIKRLYQSS", "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSS", @@ -2750,9 +3290,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5498, "end": 5744, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.751219512195122, "protein": "MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM", "aminoacids": "MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM*", @@ -2760,9 +3302,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5661, "end": 8262, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.5663551401869167, "protein": "MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL", "aminoacids": "MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*", @@ -2770,9 +3314,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7843, "end": 7936, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.4866666666666659, "protein": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD", "aminoacids": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD*", @@ -2780,9 +3326,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7844, "end": 8120, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.4285714285714286, "protein": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE", "aminoacids": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*", @@ -2790,9 +3338,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8263, "end": 8911, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.7471544715447078, "protein": "MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC", "aminoacids": "MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*H*", @@ -2802,9 +3352,11 @@ "MK115464.1": [ { "name": "gag", - "orientation": "forward", "start": 527, "end": 2297, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 1.495, "protein": "MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ", "aminoacids": "MLQAIPGLRVGPAGSHPFALTSLSASCCHQSQSPGCSGATARTGT*KRK*NQRSSLDAGLGLLKRARQEARGGDW*VRQF*LAEARRREISARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADKGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNA*VKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAE*DRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIA*MTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKN*MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ*", @@ -2812,9 +3364,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2089, "end": 5101, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 1.8783649052841465, "protein": "AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED", "aminoacids": "FFKEDLAFLQRKAKELSSEQTRANSPTRRELQV*GGDSNSSSEAGAGGQRSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEISLPGR*KPKMIEGIGGFIKVRQYDQITIEICGHKAIGTVLVGPTPVNIIGRNLLTQISCTLNFPISPIETVPVQLKPGIDSPKVKQWPLTEEKIKALVEICTEMEKEKKISKIRPENPYNTPVFAIKKKDSTK*RKLVDFKELNKRTQDF*EVQLRIPHPARLKKKKSITVLDVGDAYFSIPLDKDFKKYTAFTIPSINNKTPEIRYQYNVLPQG*KRSPAIFQSSMIKILEPFRKQNPDIVIYQYIDDLYVRSDLEIRQHRTKIEELRQHLLK*RLTTPDKKHQKEPPFLWISYELHPDKWTVQPIVLPDKDSWTVNDIQKLVRKLN*ASQIYAEIKVRQLCKLLKGAKALTEVIQLTEEAELELAENKEILKEPVHEVYYDPSKDLIAELQKQRQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVI*GKTPRFKLPIQKET*DT*WTEYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVGAETFYVDRAANKETKLRKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALRIIQAQPDKSESEIVNQIIEQLIKKEKVYLA*VPAHKRIRRNEQVDKLVSARIRKVLFLDRIDKAQEEHKKYHNN*RAMASDFNLPPVVAKKIVASCDKCQLKKEATHRQVDCSPRIWQLDCTHLEGKVILVAVHVASRYIEAEVIPAETGQETAYFLLKLAGR*PVKAIHTDNGTNFTSATVKAAC**AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED*", @@ -2822,9 +3376,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 5045, "end": 5624, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 1.494270833333335, "protein": "MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY", "aminoacids": "MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY*GLHTGERDWHLGQGVSIEWKERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRRSQTMNGH*", @@ -2832,9 +3388,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5563, "end": 5857, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.5192307692307698, "protein": "MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS", "aminoacids": "MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS*I", @@ -2842,9 +3400,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5711, "end": 6053, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 2.118055555555556, "protein": "MRILGQE", "aminoacids": "MRILGQE*EP**EFCNNCCLFISELGANIAE*ASLDRGEQEIEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ*", @@ -2852,9 +3412,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5973, "end": 6051, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEDLLKTVRLIKYLYQSS", "aminoacids": "MAGRSGDSDEDLLKTVRLIKYLYQSS", @@ -2862,9 +3424,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6065, "end": 6347, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 1.3170731707317076, "protein": "AIVLIEYKKILKQRRIDRLIDRIIDKAEDSGNESEGDQEELSAFVEIGHHAP", "aminoacids": "MQSLYILTIVALVVAAILAIVV*AIVLIEYKKILKQRRIDRLIDRIIDKAEDSGNESEGDQEELSAFVEIGHHAP*NVDDL*YCRPVVGHSLL*", @@ -2872,9 +3436,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6228, "end": 8826, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 1.8288551401869095, "protein": "MTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST", "aminoacids": "MRVKEIKRSYQHL*R*GIMLLRMLMIYSTADQWWVTVYYKVPVWREANTTLFCASDAKAYSTEAHNV*ATHACVPTDPNPQEIVIENVTEDFNMWKNNMVDQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTSNTT*GEMTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST*TKNGTDSWQSNDTQNSNITLQCRIKQIINLWQEVRKAMYAPPISRQINCTSNITGLVLTRDRRNETKTFRPGRENMKDNWRSKLYKYKVVRIEPLRIAPTKAKRRVVQREKRAVRLGAMFLKFLGAARSTIGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLAVERYLQDQQLLGL*GCSRKLICTTTVP*NRS*GRHNKNYKSLDDI*DNMT*IE*EKEIDNYTSLIYTLITESHSQQKKNEQELLALDK*ASL*N*FDISQWLWYIKIFIMIVGGLVSLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPERIEERGRERDKGRSGRLVNGFLALI*DDLRSLCLFSYHRLSDLLLIVIKIVELLRRKR*EALKY**NLLQY*SQELKNSAVSLLNTTAIVVAERTDKIIEILQRISRAFLHIPRRIRQGLEKALL*DRWQVVKK*", @@ -2882,9 +3448,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8380, "end": 8476, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.6000000000000001, "protein": "RPSSQPREEPTGPKE", "aminoacids": "RPSSQPREEPTGPKE*KKEVERETKADPVD**", @@ -2892,9 +3460,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8381, "end": 8657, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.8274725274725274, "protein": "RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE", "aminoacids": "DPPPSPERSRQARKNRRKR*RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE*", @@ -2902,9 +3472,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 9064, "end": 9496, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 1.64878048780488, "protein": "MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC", "aminoacids": "MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*HRAFHQGLSRRGVA*", @@ -2914,9 +3486,11 @@ "MK115530.1": [ { "name": "gag", - "orientation": "forward", "start": 746, "end": 2252, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -2924,9 +3498,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2038, "end": 5050, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14755732801595212, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -2934,9 +3510,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4994, "end": 5573, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.36979166666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -2944,9 +3522,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5512, "end": 5806, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -2954,9 +3534,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5783, "end": 6002, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", @@ -2964,9 +3546,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5922, "end": 6000, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", @@ -2974,9 +3558,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6014, "end": 6260, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6500000000000001, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -2984,9 +3570,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6177, "end": 8718, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.4941588785046729, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -2994,9 +3582,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8299, "end": 8395, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -3004,9 +3594,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8300, "end": 8585, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.4285714285714286, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -3014,9 +3606,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8719, "end": 9340, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.5918699186991796, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -3026,9 +3620,11 @@ "MK115520.1": [ { "name": "gag", - "orientation": "forward", "start": 695, "end": 2195, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*", @@ -3036,9 +3632,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1987, "end": 4915, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 1.3952143569292395, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDMGNGQYSL", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDMGNGQYSL*YCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QR*YH*QKKQS*NWQKTGKF*ENQYMECIMTHQKT**QKYRSRAMDSGHIKFIKSHLKI*KQENMQE*GVPTLMM*NN*QRQYKR*PQKA**YGEKLLNLDYLYKKKHGRHGGQSTGKPPGFLSGSLSIPLP**NYGTN*RKNP**EQKLSM*MGQLIEKLN*AKQDMSLTEEDKRLSP*RTQQIKRLSYKQFI*LCRIRDQK*T**QTHNIH*ESFKHNQIRVNQS*SIR**SS**KRKKSTWHGYQHTKELEEMNK*TN*SVLESGEYYF*ME*IRPKKTMRNITVIGEQWLVILIYPL**QKK**PAVINVSKKERPCMDK*IVVQEYGN*IVHI*KGKLSW*QFM*PVDI*KQKLFQQRQGRKQHTFS*N*QGDGQ*KQYIQTMAAISPVMWLRPPVGGQGSSRNLAFPTIPKVKE**NP*IKN*RKL*DR*EIRLNILRQQYKWQYSSTILKEKGGLGGIVQGKE**I**QQTYKLKNYRNKLQKFKIFGFITGTAEIHFGKDQQSFSGKVKGQ**YKIIVI*K*", @@ -3046,9 +3644,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4948, "end": 5527, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.36979166666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -3056,9 +3656,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5466, "end": 5760, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -3066,9 +3668,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5737, "end": 5956, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", @@ -3076,9 +3680,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5876, "end": 5957, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6346153846153846, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -3086,9 +3692,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5968, "end": 6214, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6500000000000001, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -3096,9 +3704,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6131, "end": 8672, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.49065420560747675, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -3106,9 +3716,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8253, "end": 8349, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -3116,9 +3728,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8254, "end": 8539, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.4285714285714286, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -3126,9 +3740,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8673, "end": 9294, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -3138,9 +3754,11 @@ "MK115503.1": [ { "name": "gag", - "orientation": "forward", "start": 817, "end": 2323, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -3148,9 +3766,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2109, "end": 5121, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14755732801595212, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -3158,9 +3778,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 5065, "end": 5644, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.35416666666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -3168,9 +3790,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5583, "end": 5877, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -3178,9 +3802,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5854, "end": 6073, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", @@ -3188,9 +3814,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5993, "end": 6074, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6346153846153846, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -3198,9 +3826,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6085, "end": 6331, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6865853658536587, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -3208,9 +3838,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6248, "end": 8789, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.49135514018691584, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -3218,9 +3850,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8370, "end": 8466, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -3228,9 +3862,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8371, "end": 8656, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.39560439560439553, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -3238,9 +3874,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8790, "end": 9411, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -3250,9 +3888,11 @@ "MK115570.1": [ { "name": "gag", - "orientation": "forward", "start": 687, "end": 2193, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.25119999999999987, "protein": "MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -3260,9 +3900,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1979, "end": 4991, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14456630109670976, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -3270,9 +3912,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4935, "end": 5514, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.35416666666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -3280,9 +3924,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5453, "end": 5747, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -3290,9 +3936,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5724, "end": 5940, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3300,9 +3948,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5863, "end": 5941, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", @@ -3310,9 +3960,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5955, "end": 6201, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6500000000000001, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -3320,9 +3972,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6118, "end": 8659, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.49649532710280364, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -3330,9 +3984,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8240, "end": 8336, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -3340,9 +3996,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8241, "end": 8526, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.39560439560439553, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -3350,9 +4008,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8660, "end": 9281, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -3362,9 +4022,11 @@ "MK115509.1": [ { "name": "gag", - "orientation": "forward", "start": 555, "end": 2061, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -3372,9 +4034,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1847, "end": 4859, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14755732801595212, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -3382,9 +4046,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4803, "end": 5382, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.35416666666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -3392,9 +4058,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5321, "end": 5615, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -3402,9 +4070,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5592, "end": 5808, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3412,9 +4082,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5731, "end": 5809, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", @@ -3422,9 +4094,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5823, "end": 6069, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6865853658536587, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -3432,9 +4106,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5986, "end": 8527, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.49135514018691584, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -3442,9 +4118,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8108, "end": 8204, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -3452,9 +4130,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8109, "end": 8394, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.39560439560439553, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -3462,9 +4142,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8528, "end": 9149, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -3474,9 +4156,11 @@ "MK115702.1": [ { "name": "gag", - "orientation": "forward", "start": 246, "end": 1782, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2866000000000015, "protein": "MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ", "aminoacids": "MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ*SQ*", @@ -3484,9 +4168,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1544, "end": 4586, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.18175473579262214, "protein": "FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -3494,9 +4180,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4530, "end": 5109, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.34375, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*", @@ -3504,9 +4192,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5048, "end": 5342, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.44230769230769296, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS*P", @@ -3514,9 +4204,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5319, "end": 5535, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6319444444444446, "protein": "MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ", "aminoacids": "MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ", @@ -3524,9 +4216,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5458, "end": 5536, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.8076923076923077, "protein": "MAGRSGDGDEDLLKAVRLIKTLYQSS", "aminoacids": "MAGRSGDGDEDLLKAVRLIKTLYQSS", @@ -3534,9 +4228,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5550, "end": 5808, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.807317073170732, "protein": "MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND", "aminoacids": "MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND**", @@ -3544,9 +4240,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5716, "end": 8257, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.6026869158878512, "protein": "MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE", "aminoacids": "MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE*DRA*", @@ -3554,9 +4252,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7874, "end": 7970, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.6866666666666661, "protein": "RPASQSRGDPTGPKEPKKKVERETETDPTD", "aminoacids": "RPASQSRGDPTGPKEPKKKVERETETDPTD**", @@ -3564,9 +4264,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7875, "end": 8160, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.3296703296703296, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE", "aminoacids": "DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE*CC*", @@ -3574,9 +4276,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8275, "end": 8896, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.658536585365846, "protein": "MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC", "aminoacids": "MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC*", @@ -3586,9 +4290,11 @@ "MK115095.1": [ { "name": "gag", - "orientation": "forward", "start": 2, "end": 1697, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 1.8384000000000005, "protein": "MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC", "aminoacids": "SGFSFTFKSLFGRHLGDLKAKEKPEELSRRRTRLAERARQEARRGD**VRRNF*LAEARRREIGARASVLSGGELDR*EKIYLRPGRKKKYRLKHIVWASRELERFAVNPGLLKSSEGCRQILGQLQPALQTGSEELRSLYNTIAVLYCVHQKINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQIVHQPISPRTLNA*VKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVRRHQAAMQMLKETINDEAAE*DRLHPVHAGPIAPGQMKEPRRSDIAGTTSTLQEQIR*MTNNPPIPVGEIYKR*IILRLNKIVKMYSPVSILDIRQRPKEPFKDYVDRFYKTLKAEQASQDVKN*MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC*KCGKKGHQMKDCTKRQANFLRKIWPSHKGRPKNFLQSRPEPTAPPAESFRFKEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*", @@ -3596,9 +4302,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1489, "end": 4579, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 1.9898305084745753, "protein": "KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK", "aminoacids": "FFKEDLAFPQGKAKEFSPEQTRANSPASRELQV*GRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIRRQLKEALLDTGADDTVLKEINLPGK*KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK*RKLVDFRELNKRTQDF*KVQLRIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPRVRYQYNVLPQR*KGSPAIFQSSMTKILEPFRKENPDIVIYQYIDDLYVRSDLEIEQHRTKIEELRQHLLK*RLTTPDKKHQKEPPFL*ISYELHPNKWTVQPIQLPDKDS*TVNDIQKLVRKLN*ASQIYPEIKVKQLCKLLRRTKALTEVVPLTEEAELELAENKEILKEPVHRAYYDPSKDLIAEVQKQGGDQWTYQIYQKPFKNLKTKKYARTRGAHTNDVKQLTEAVQKIALEAIVI*RKTPKFKLPIQKET*EM**TEYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVRAETFYVDRAANRETKLRKARYVTDRRRQKVVSLIDTTNQRTKLHAIHLALQDSGSTVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKEKIYLA*VPAHKRIRRNEQVDKLVSSRIRKVLFLDRIDKAQEEHEKYHSN*RAMASDFNLPPVVAKEIVASCDKCQLKREPMHGQVDCSPGIWQLDCTHLERKIILVAVHVASRYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAAC**ARIKQKFSIPYNPQSQGVVESMNNELKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKRGIGGYSAEERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLL*KGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*NMEQFSKTPYAYFKESSEMSLQTSP*", @@ -3606,9 +4314,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4445, "end": 5024, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 1.8546875000000016, "protein": "MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR", "aminoacids": "MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR*VYRHHHESHNPKTSSEVHIPLREARLVIKTY*GLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVRPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKRSHTMNGH*", @@ -3616,9 +4326,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 4963, "end": 5257, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.5961538461538467, "protein": "MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS", "aminoacids": "MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS*L", @@ -3626,9 +4338,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5288, "end": 5453, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 1.1236111111111113, "protein": "MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ", "aminoacids": "MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ*", @@ -3636,9 +4350,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5373, "end": 5451, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6538461538461537, "protein": "MAGRSGDSDEELLTAVRIIKRLYQSS", "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSS", @@ -3646,9 +4362,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5465, "end": 5711, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 1.3548780487804881, "protein": "SIVLIEYKKILRQKKIDRLIDRIRERAEDSGNESDEDQEELSAIVEIGHLVP", "aminoacids": "MHALEIAAIVRLVVAAIIAIVV*SIVLIEYKKILRQKKIDRLIDRIRERAEDSGNESDEDQEELSAIVEIGHLVP*DSDDM*", @@ -3656,9 +4374,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5628, "end": 8229, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 1.8721962616822374, "protein": "MTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD", "aminoacids": "MKVTRTRKNYQQL*R*GILFLRIVMICSANNL*VTVYYEVPVWKEATTTLFCASDAKAYKTEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDELNLNCPNNNTCSNNTKYNMTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD*NDTLKQIVIKLKEKFKNKTIVFNQSSGKDPEIVMHSFNCREEFFYCNTTQLFNST*NNNT*NGTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQGQIRCSSNITGLLLVRDSKSNNSSNDTKTFRPRRGDMKDN*RSELYKYKVVKIEPLRIAPTHAKRRVVQKEKRAIGLRAFFLKFLGAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLALERYLKDQQLLKI*GCSRKLICTTNVP*NVS*SPR*NRSLDKI*TNMT*KQ*EKEIDNYTDTIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQWL*YIKIFIMIVRGLISLRIVFTILSIVNRVRQRYSPLSLQTLLPTQRGPDRPERTEEGGREKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLRDLLLIVARIVELLRRRK*EALKYW*NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL*", @@ -3666,9 +4386,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7810, "end": 7903, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.4866666666666659, "protein": "RPSSQPRGDPTGPKEQKKEVERKTEAHPRD", "aminoacids": "RPSSQPRGDPTGPKEQKKEVERKTEAHPRD*", @@ -3676,9 +4398,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7811, "end": 8087, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 1.2406593406593407, "protein": "ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE", "aminoacids": "DPPPNPEGTRQARKNRRRR*RERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE*", @@ -3686,9 +4410,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8287, "end": 8878, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.9788617886178801, "protein": "MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC", "aminoacids": "MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*H*", @@ -3698,9 +4424,11 @@ "MK115490.1": [ { "name": "gag", - "orientation": "forward", "start": 549, "end": 2055, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -3708,9 +4436,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1841, "end": 4853, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14755732801595212, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -3718,9 +4448,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4797, "end": 5376, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.36979166666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -3728,9 +4460,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5315, "end": 5609, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -3738,9 +4472,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5586, "end": 5802, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3748,9 +4484,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5725, "end": 5803, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", @@ -3758,9 +4496,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5817, "end": 6063, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6500000000000001, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -3768,9 +4508,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5980, "end": 8521, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.4941588785046729, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -3778,9 +4520,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8102, "end": 8198, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -3788,9 +4532,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8103, "end": 8388, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.4285714285714286, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -3798,9 +4544,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8522, "end": 9143, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.5918699186991796, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -3810,9 +4558,11 @@ "MK115576.1": [ { "name": "gag", - "orientation": "forward", "start": 468, "end": 1974, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.2571999999999999, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", "aminoacids": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*R*", @@ -3820,9 +4570,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1760, "end": 4772, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14755732801595212, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -3830,9 +4582,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4716, "end": 5295, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.35416666666666674, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", "aminoacids": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*", @@ -3840,9 +4594,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5234, "end": 5528, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4038461538461544, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", "aminoacids": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*T", @@ -3850,9 +4606,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5505, "end": 5721, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3860,9 +4618,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5644, "end": 5722, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", @@ -3870,9 +4630,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5736, "end": 5982, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6865853658536587, "protein": "MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", "aminoacids": "MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*", @@ -3880,9 +4642,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5899, "end": 8440, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.49018691588785046, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", "aminoacids": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*", @@ -3890,9 +4654,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8021, "end": 8117, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.28666666666666596, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", "aminoacids": "RPTSQPRGDPTGPKESKKKVEKETETDQFD**", @@ -3900,9 +4666,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8022, "end": 8307, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.39560439560439553, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*CY*", @@ -3910,9 +4678,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8441, "end": 9062, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6162601626016186, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", "aminoacids": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*H*", @@ -3922,9 +4692,11 @@ "OQ092466": [ { "name": "gag", - "orientation": "forward", "start": 825, "end": 2361, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.16679999999999984, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ", "aminoacids": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ*", @@ -3932,9 +4704,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2147, "end": 5165, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14356929212362912, "protein": "FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -3942,9 +4716,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 5109, "end": 5688, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.203125, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*", @@ -3952,9 +4728,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5627, "end": 5921, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.3653846153846132, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*A", @@ -3962,9 +4740,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5898, "end": 6114, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.45833333333333326, "protein": "MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ", @@ -3972,9 +4752,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 6037, "end": 6115, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDDELLKTVRLIKVLYQSS", "aminoacids": "MAGRSGDSDDELLKTVRLIKVLYQSS", @@ -3982,9 +4764,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6129, "end": 6375, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6097560975609757, "protein": "MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL", "aminoacids": "MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL*", @@ -3992,9 +4776,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6292, "end": 8902, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.5255841121495328, "protein": "MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL", "aminoacids": "MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL*DGWQMVKK*", @@ -4002,9 +4788,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8456, "end": 8552, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.886666666666666, "protein": "RSTPQLRGDPTGPKESKEKVERETETDPVH", "aminoacids": "RSTPQLRGDPTGPKESKEKVERETETDPVH**", @@ -4012,9 +4800,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8457, "end": 8733, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.3626373626373627, "protein": "DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE", "aminoacids": "DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE*", @@ -4022,9 +4812,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8876, "end": 9509, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.5040650406503988, "protein": "MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC", "aminoacids": "MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC*", @@ -4034,9 +4826,11 @@ "OQ092463": [ { "name": "gag", - "orientation": "forward", "start": 801, "end": 2313, + "subtype_start": 140, + "subtype_end": 1643, + "orientation": "forward", "distance": 0.20240000000000014, "protein": "MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ", "aminoacids": "MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ*", @@ -4044,9 +4838,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2105, "end": 5117, + "subtype_start": 1435, + "subtype_end": 4447, + "orientation": "forward", "distance": 0.10767696909272173, "protein": "FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -4054,9 +4850,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 5061, "end": 5640, + "subtype_start": 4391, + "subtype_end": 4970, + "orientation": "forward", "distance": 0.296875, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*", @@ -4064,9 +4862,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5579, "end": 5870, + "subtype_start": 4909, + "subtype_end": 5200, + "orientation": "forward", "distance": 0.30208333333333326, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAITRILQQLLFIHFRIGCQHSRIGIIQRRRARNGTSRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAITRILQQLLFIHFRIGCQHSRIGIIQRRRARNGTSRS*", @@ -4074,9 +4874,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5850, "end": 6066, + "subtype_start": 5180, + "subtype_end": 5395, + "orientation": "forward", "distance": 0.38888888888888884, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ", @@ -4084,9 +4886,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5989, "end": 6067, + "subtype_start": 5319, + "subtype_end": 5395, + "orientation": "forward", "distance": 0.34615384615384626, "protein": "MAGRSGDSDEELIKTVRLIKLLYQSS", "aminoacids": "MAGRSGDSDEELIKTVRLIKLLYQSS", @@ -4094,9 +4898,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6081, "end": 6330, + "subtype_start": 5411, + "subtype_end": 5657, + "orientation": "forward", "distance": 0.44999999999999996, "protein": "MQPLEISAIVALVVAIIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL", "aminoacids": "MQPLEISAIVALVVAIIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL*", @@ -4104,9 +4910,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6244, "end": 8827, + "subtype_start": 5574, + "subtype_end": 8124, + "orientation": "forward", "distance": 0.44534746760895216, "protein": "MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFYASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNTTSTKNTTPSTTASSGERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKKFNGSGPCTNVSTIQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKTIIVHLKDSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSSWKDESNGTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLITRDGGKNNESNTTEIFRPEGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKTLEQIWDNMTWMQWEREIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHPPAPRGPDRPEGIGEEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLNIPRRIRQGLERALL", "aminoacids": "MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFYASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNTTSTKNTTPSTTASSGERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKKFNGSGPCTNVSTIQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKTIIVHLKDSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSSWKDESNGTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLITRDGGKNNESNTTEIFRPEGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKTLEQIWDNMTWMQWEREIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHPPAPRGPDRPEGIGEEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLNIPRRIRQGLERALL*", @@ -4114,9 +4922,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8408, "end": 8504, + "subtype_start": 7705, + "subtype_end": 7798, + "orientation": "forward", "distance": 0.6000000000000001, "protein": "RPTPQPRGDPTGQKESEKKVERETETDPDH", "aminoacids": "RPTPQPRGDPTGQKESEKKVERETETDPDH**", @@ -4124,9 +4934,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8409, "end": 8685, + "subtype_start": 7706, + "subtype_end": 7982, + "orientation": "forward", "distance": 0.3296703296703296, "protein": "DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE*", @@ -4134,9 +4946,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8828, "end": 9461, + "subtype_start": 8125, + "subtype_end": 8752, + "orientation": "forward", "distance": 0.29182692307692304, "protein": "MGGKWSKSSVVGWPAIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC", "aminoacids": "MGGKWSKSSVVGWPAIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC*", @@ -4146,9 +4960,11 @@ "OQ092465": [ { "name": "gag", - "orientation": "forward", "start": 855, "end": 2364, + "subtype_start": 200, + "subtype_end": 1700, + "orientation": "forward", "distance": 0.3737903225806454, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQQIDVKDTKEALDKIEEEQNKSKKKVQQAATDTGNNSQASQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGAIMMQRGNFRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEETTTPSQKQEPIDKELYPLASLRSLFGNDPSSQ", "aminoacids": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQQIDVKDTKEALDKIEEEQNKSKKKVQQAATDTGNNSQASQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGAIMMQRGNFRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEETTTPSQKQEPIDKELYPLASLRSLFGNDPSSQ*R*", @@ -4156,9 +4972,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2150, "end": 5162, + "subtype_start": 1492, + "subtype_end": 4504, + "orientation": "forward", "distance": 0.1734795613160518, "protein": "FFREDLAFPQGEAREFSSEQTRANSPTSRELQVRGGDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCRLLKGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFREDLAFPQGEAREFSSEQTRANSPTSRELQVRGGDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCRLLKGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -4166,9 +4984,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 5106, "end": 5685, + "subtype_start": 4448, + "subtype_end": 5027, + "orientation": "forward", "distance": 0.33854166666666674, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWIYKHHYDSINPKISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADRLIHLYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALTALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWIYKHHYDSINPKISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADRLIHLYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALTALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*", @@ -4176,9 +4996,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5624, "end": 5915, + "subtype_start": 4966, + "subtype_end": 5257, + "orientation": "forward", "distance": 0.17708333333333326, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGILQRRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGILQRRRARNGASRS*", @@ -4186,9 +5008,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5895, "end": 6111, + "subtype_start": 5237, + "subtype_end": 5452, + "orientation": "forward", "distance": 0.25, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ", @@ -4196,9 +5020,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 6034, "end": 6112, + "subtype_start": 5376, + "subtype_end": 5452, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELIKTVRLIKLLYQSS", "aminoacids": "MAGRSGDSDEELIKTVRLIKLLYQSS", @@ -4206,9 +5032,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6126, "end": 6375, + "subtype_start": 5468, + "subtype_end": 5708, + "orientation": "forward", "distance": 0.3063291139240505, "protein": "MQPLVISAIVALVVVAIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL", "aminoacids": "MQPLVISAIVALVVVAIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL*", @@ -4216,9 +5044,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6289, "end": 8881, + "subtype_start": 5631, + "subtype_end": 8208, + "orientation": "forward", "distance": 0.5249417249417256, "protein": "MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTGANNTTSTNTTTPSTTVSSEERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNTSYRLISCNTSVITQACPKVTFEPIPIHYCAPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKNIIVHLNKSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLEQVFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSYWKGEGSNNDTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLLTRDGGNESETTDTETFRPVGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKNLTQIWDNMTWMQWEKEIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL", "aminoacids": "MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTGANNTTSTNTTTPSTTVSSEERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNTSYRLISCNTSVITQACPKVTFEPIPIHYCAPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKNIIVHLNKSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLEQVFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSYWKGEGSNNDTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLLTRDGGNESETTDTETFRPVGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKNLTQIWDNMTWMQWEKEIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL*", @@ -4226,9 +5056,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8462, "end": 8558, + "subtype_start": 7789, + "subtype_end": 7882, + "orientation": "forward", "distance": 3.5, "protein": "RPTSQPRGDPTGQKESKEKVERETETDPDH", "aminoacids": "RPTSQPRGDPTGQKESKEKVERETETDPDH**", @@ -4236,9 +5068,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8463, "end": 8739, + "subtype_start": 7790, + "subtype_end": 8066, + "orientation": "forward", "distance": 0.41758241758241765, "protein": "DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE*", @@ -4246,9 +5080,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8882, "end": 9515, + "subtype_start": 8209, + "subtype_end": 8842, + "orientation": "forward", "distance": 0.3285714285714285, "protein": "MGGKWSKSSVVGWPKIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC", "aminoacids": "MGGKWSKSSVVGWPKIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC*", @@ -4258,9 +5094,11 @@ "OQ092462": [ { "name": "gag", - "orientation": "forward", "start": 767, "end": 2270, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.27679999999999993, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ", "aminoacids": "MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ*", @@ -4268,9 +5106,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2062, "end": 5074, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.1495513459621136, "protein": "FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -4278,9 +5118,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 5018, "end": 5597, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.34375, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH*", @@ -4288,9 +5130,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5536, "end": 5830, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.32692307692307465, "protein": "MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS", "aminoacids": "MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS*P", @@ -4298,9 +5142,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5807, "end": 6026, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.41666666666666674, "protein": "MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ", "aminoacids": "MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ*", @@ -4308,9 +5154,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5946, "end": 6024, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLKAVRLIKFLYQSS", "aminoacids": "MAGRSGDSDEELLKAVRLIKFLYQSS", @@ -4318,9 +5166,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6038, "end": 6284, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.7073170731707319, "protein": "MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL", "aminoacids": "MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL*", @@ -4328,9 +5178,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6201, "end": 8844, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.5698598130841122, "protein": "MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL", "aminoacids": "MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL*DGWQGVKNEGMGCCKGKNEAN*", @@ -4338,9 +5190,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8359, "end": 8455, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.4866666666666659, "protein": "RPASQPRGDPTGPKEPTKKVERETETDPDH", "aminoacids": "RPASQPRGDPTGPKEPTKKVERETETDPDH**", @@ -4348,9 +5202,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8360, "end": 8636, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.39560439560439553, "protein": "DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE", "aminoacids": "DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE*", @@ -4358,9 +5214,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8779, "end": 9406, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.7422764227642202, "protein": "MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC", "aminoacids": "MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC*", @@ -4370,9 +5228,11 @@ "OQ092464": [ { "name": "gag", - "orientation": "forward", "start": 773, "end": 2282, + "subtype_start": 200, + "subtype_end": 1700, + "orientation": "forward", "distance": 0.38588709677419364, "protein": "MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ", "aminoacids": "MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ*R*", @@ -4380,9 +5240,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2068, "end": 5080, + "subtype_start": 1492, + "subtype_end": 4504, + "orientation": "forward", "distance": 0.1734795613160518, "protein": "FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -4390,9 +5252,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 5024, "end": 5603, + "subtype_start": 4448, + "subtype_end": 5027, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*", @@ -4400,9 +5264,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5542, "end": 5833, + "subtype_start": 4966, + "subtype_end": 5257, + "orientation": "forward", "distance": 0.20833333333333326, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGIIQRRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGIIQRRRARNGASRS*", @@ -4410,9 +5276,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5813, "end": 6032, + "subtype_start": 5237, + "subtype_end": 5452, + "orientation": "forward", "distance": 0.25, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAPPDSQTHQASLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAPPDSQTHQASLSKQ*", @@ -4420,9 +5288,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5952, "end": 6030, + "subtype_start": 5376, + "subtype_end": 5452, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEELLQTVRLIKLLYQSS", "aminoacids": "MAGRSGDSDEELLQTVRLIKLLYQSS", @@ -4430,9 +5300,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6044, "end": 6290, + "subtype_start": 5468, + "subtype_end": 5708, + "orientation": "forward", "distance": 0.4265822784810127, "protein": "MQPLHIAAIVALVVAIIIAIVVWSIVFIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVEMGHCAPWDVNDL", "aminoacids": "MQPLHIAAIVALVVAIIIAIVVWSIVFIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVEMGHCAPWDVNDL*", @@ -4440,9 +5312,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6207, "end": 8790, + "subtype_start": 5631, + "subtype_end": 8208, + "orientation": "forward", "distance": 0.5058275058275068, "protein": "MRVRGIKKNYQHLWRWGIVLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNNTTSTNDTTSTTTSSGEKMKEGEIKNCSFNITTSIRDKVQKEYALFYKPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGSCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSENFSDNAKTIIVHLNESVEITCIRPNNNTRKSIPIGPGRAFYATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNKTIIFTHSSGGDPEVVTHNFNCGGEFFYCNTTKLFNSTWNETSYWKDERSNDNDTITLPCRIKQIINLWQEVGKAMYAPPIRGYIKCSSNITGLLITRDGGKNESNTTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWDNMTWMEWEREIDNYTSLIYTLIEKSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSGPLVNGFLTIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL", "aminoacids": "MRVRGIKKNYQHLWRWGIVLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNNTTSTNDTTSTTTSSGEKMKEGEIKNCSFNITTSIRDKVQKEYALFYKPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGSCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSENFSDNAKTIIVHLNESVEITCIRPNNNTRKSIPIGPGRAFYATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNKTIIFTHSSGGDPEVVTHNFNCGGEFFYCNTTKLFNSTWNETSYWKDERSNDNDTITLPCRIKQIINLWQEVGKAMYAPPIRGYIKCSSNITGLLITRDGGKNESNTTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWDNMTWMEWEREIDNYTSLIYTLIEKSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSGPLVNGFLTIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL*", @@ -4450,9 +5324,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8371, "end": 8467, + "subtype_start": 7789, + "subtype_end": 7882, + "orientation": "forward", "distance": 3.5, "protein": "RPTSQPRGDPTGQKESKKKVERETETDPDH", "aminoacids": "RPTSQPRGDPTGQKESKKKVERETETDPDH**", @@ -4460,9 +5336,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8372, "end": 8648, + "subtype_start": 7790, + "subtype_end": 8066, + "orientation": "forward", "distance": 0.3846153846153846, "protein": "DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILNNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGTPQILVESPAVLESGTKE", "aminoacids": "DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILNNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGTPQILVESPAVLESGTKE*", @@ -4470,9 +5348,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8791, "end": 9412, + "subtype_start": 8209, + "subtype_end": 8842, + "orientation": "forward", "distance": 0.3542857142857141, "protein": "MGGKWSKSSVVGWPAIRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEDEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIHSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC", "aminoacids": "MGGKWSKSSVVGWPAIRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEDEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIHSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC*", @@ -4482,9 +5362,11 @@ "OQ092467": [ { "name": "gag", - "orientation": "forward", "start": 808, "end": 2308, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.24380000000000002, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ", "aminoacids": "MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ*", @@ -4492,9 +5374,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2100, "end": 5112, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.14356929212362912, "protein": "FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -4502,9 +5386,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 5056, "end": 5644, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.43229166666666674, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH*SF*", @@ -4512,9 +5398,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5574, "end": 5868, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.4807692307692313, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*T", @@ -4522,9 +5410,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5845, "end": 6064, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ*", @@ -4532,9 +5422,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5984, "end": 6065, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6346153846153846, "protein": "MAGRSGDSDEDLLKTVRLIKQLYQSSK", "aminoacids": "MAGRSGDSDEDLLKTVRLIKQLYQSSK", @@ -4542,9 +5434,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6076, "end": 6340, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.5439024390243903, "protein": "MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL", "aminoacids": "MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL*", @@ -4552,9 +5446,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6239, "end": 8807, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.49988317757009404, "protein": "MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL", "aminoacids": "MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL*", @@ -4562,9 +5458,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8388, "end": 8484, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.886666666666666, "protein": "RPASQLRGDQTGPKEQKKKVERETETDPGN", "aminoacids": "RPASQLRGDQTGPKEQKKKVERETETDPGN**", @@ -4572,9 +5470,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8389, "end": 8674, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.38351648351648326, "protein": "DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC", "aminoacids": "DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC*", @@ -4582,9 +5482,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8808, "end": 9417, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.6048780487804808, "protein": "MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC", "aminoacids": "MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC*", diff --git a/tests/expected-results-single-csv/orfs.csv b/tests/expected-results-single-csv/orfs.csv index b97f18a..1c28581 100644 --- a/tests/expected-results-single-csv/orfs.csv +++ b/tests/expected-results-single-csv/orfs.csv @@ -1,12 +1,12 @@ -seqid,name,start,end,orientation,distance,protein,aminoacids -MN692145,gag,775,2287,forward,0.15900000000000003,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*R* -MN692145,pol,2070,5085,forward,0.10618145563310066,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED* -MN692145,vif,5029,5608,forward,0.21875,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH* -MN692145,vpr,5547,5841,forward,0.44358974358974423,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*T -MN692145,tat_exon1,5818,6037,forward,0.29166666666666674,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ* -MN692145,rev_exon1,5957,6038,forward,0.5192307692307692,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK -MN692145,vpu,6049,6298,forward,0.5804878048780489,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL* -MN692145,env,6212,8783,forward,0.4975467289719626,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL* -MN692145,tat_exon2,8364,8460,forward,0.4866666666666659,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH** -MN692145,rev_exon2,8365,8641,forward,0.2637362637362637,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE* -MN692145,nef,8784,9576,forward,0.3878048780487735,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*HRAFYKGLSAGDFPGEAWPGRGRGVASPQMLHISSCFCLYWVSLVRPDLSLGALWLTREPTA* +seqid,name,start,end,subtype_start,subtype_end,orientation,distance,protein,aminoacids,nucleotides +MN692145,gag,775,2287,789,2292,forward,0.15900000000000003,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*R*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGAACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGGACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGATAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACACAGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAATGGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAAAACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAG +MN692145,pol,2070,5085,2084,5096,forward,0.10618145563310066,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGGACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATACCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATCAAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACTGGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN692145,vif,5029,5608,5040,5619,forward,0.21875,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTATGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGACCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCATATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCCTAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAG +MN692145,vpr,5547,5841,5558,5850,forward,0.44358974358974423,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*T,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAGACT +MN692145,tat_exon1,5818,6037,5830,6045,forward,0.29166666666666674,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA +MN692145,rev_exon1,5957,6038,5969,6045,forward,0.5192307692307692,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN692145,vpu,6049,6298,6061,6310,forward,0.5804878048780489,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*,ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG +MN692145,env,6212,8783,6224,8795,forward,0.4975467289719626,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA +MN692145,tat_exon2,8364,8460,8376,8469,forward,0.4866666666666659,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +MN692145,rev_exon2,8365,8641,8377,8653,forward,0.2637362637362637,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG +MN692145,nef,8784,9576,8796,9417,forward,0.3878048780487735,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*HRAFYKGLSAGDFPGEAWPGRGRGVASPQMLHISSCFCLYWVSLVRPDLSLGALWLTREPTA*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAA diff --git a/tests/expected-results-single/orfs.json b/tests/expected-results-single/orfs.json index ea9ef80..633cbe1 100644 --- a/tests/expected-results-single/orfs.json +++ b/tests/expected-results-single/orfs.json @@ -2,9 +2,11 @@ "MN692145": [ { "name": "gag", - "orientation": "forward", "start": 775, "end": 2287, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.15900000000000003, "protein": "MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ", "aminoacids": "MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*R*", @@ -12,9 +14,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2070, "end": 5085, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.10618145563310066, "protein": "FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*", @@ -22,9 +26,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 5029, "end": 5608, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.21875, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*", @@ -32,9 +38,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5547, "end": 5841, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.44358974358974423, "protein": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS", "aminoacids": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*T", @@ -42,9 +50,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5818, "end": 6037, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ", "aminoacids": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*", @@ -52,9 +62,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5957, "end": 6038, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5192307692307692, "protein": "MAGRSGDSDEELLKTVRLIKFLYQSSK", "aminoacids": "MAGRSGDSDEELLKTVRLIKFLYQSSK", @@ -62,9 +74,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6049, "end": 6298, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.5804878048780489, "protein": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL", "aminoacids": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*", @@ -72,9 +86,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6212, "end": 8783, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.4975467289719626, "protein": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL", "aminoacids": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*", @@ -82,9 +98,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8364, "end": 8460, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.4866666666666659, "protein": "RPASQPRGDPTGPKESKKKVERETETDPLH", "aminoacids": "RPASQPRGDPTGPKESKKKVERETETDPLH**", @@ -92,9 +110,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8365, "end": 8641, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.2637362637362637, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE", "aminoacids": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*", @@ -102,9 +122,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8784, "end": 9576, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.3878048780487735, "protein": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC", "aminoacids": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*HRAFYKGLSAGDFPGEAWPGRGRGVASPQMLHISSCFCLYWVSLVRPDLSLGALWLTREPTA*", diff --git a/tests/expected-results-small-csv/orfs.csv b/tests/expected-results-small-csv/orfs.csv index 9ab9398..8cb23c6 100644 --- a/tests/expected-results-small-csv/orfs.csv +++ b/tests/expected-results-small-csv/orfs.csv @@ -1,56 +1,56 @@ -seqid,name,start,end,orientation,distance,protein,aminoacids -KX505501.1,env,0,1824,forward,1.9898364485981306,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ* -KX505501.1,gag,336,1824,forward,0.3622000000000025,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ* -KX505501.1,vif,1306,1927,forward,2.1463541666666663,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI* -KX505501.1,nef,1306,1927,forward,2.1430894308943085,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI* -KX505501.1,pol,1628,1748,forward,2.1349950149551358,FCRENLAFPQGKAGEFPSEQTRANSPTSRELQVWGRDTN,FCRENLAFPQGKAGEFPSEQTRANSPTSRELQVWGRDTN* -KX505501.1,tat_exon2,1746,1824,forward,2.12,RCIRSTTRTADTELFTRDFPLGTFQ,RCIRSTTRTADTELFTRDFPLGTFQ* -KX505501.1,vpu,1747,1927,forward,2.098780487804878,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI* -KX505501.1,rev_exon2,1747,1927,forward,1.9802197802197803,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI* -KX505501.1,vpr,1748,1751,forward,2.1884615384615382,M,M -KX505501.1,tat_exon1,1748,1751,forward,2.1875,M,M -KX505501.1,rev_exon1,1748,1751,forward,2.1653846153846152,M,M -MN691959,gag,639,2142,forward,0.05400000000000005,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ* -MN691959,pol,1934,4946,forward,0.03589232303090717,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MN691959,vif,4890,5469,forward,0.0625,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH* -MN691959,vpr,5408,5702,forward,0.21153846153845945,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*T -MN691959,tat_exon1,5679,5895,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ -MN691959,rev_exon1,5818,5896,forward,0.5769230769230769,MAGRSGDSDEDLLKTVRLIKFLYQSS,MAGRSGDSDEDLLKTVRLIKFLYQSS -MN691959,vpu,5910,6156,forward,0.7060975609756097,SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL,MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL* -MN691959,env,6070,8683,forward,0.0867990654205606,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*DGWQVVKK* -MN691959,tat_exon2,8237,8333,forward,0.19999999999999996,RPTSQTRGDPTGPKE,RPTSQTRGDPTGPKE*KKKVERETETDPFD** -MN691959,rev_exon2,8238,8514,forward,0.16483516483516492,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE* -MN691959,nef,8657,9278,forward,0.16991869918698432,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC* -MN692074,env,2,4115,forward,1.9582943925233647,MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI* -MN692074,gag,789,2292,forward,0.13880000000000003,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ* -MN692074,pol,2084,4115,forward,0.7912263210369039,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI* -MN692074,vif,3617,4115,forward,1.9968750000000002,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI* -MN692074,vpr,3617,4085,forward,1.9602564102564104,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDT,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDT -MN692074,nef,3617,4115,forward,1.965040650406504,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI* -MN692074,tat_exon1,3823,4084,forward,2.0305555555555554,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY -MN692074,rev_exon1,3823,4084,forward,2.0153846153846153,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY -MN692074,vpu,4080,4164,forward,2.09390243902439,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI* -MN692074,tat_exon2,4080,4164,forward,2.1133333333333333,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI* -MN692074,rev_exon2,4080,4164,forward,2.065934065934066,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI* -MN692145,gag,775,2287,forward,0.15900000000000003,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*R* -MN692145,pol,2070,5085,forward,0.10618145563310066,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED* -MN692145,vif,5029,5608,forward,0.21875,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH* -MN692145,vpr,5547,5841,forward,0.44358974358974423,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*T -MN692145,tat_exon1,5818,6037,forward,0.29166666666666674,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ* -MN692145,rev_exon1,5957,6038,forward,0.5192307692307692,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK -MN692145,vpu,6049,6298,forward,0.5804878048780489,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL* -MN692145,env,6212,8783,forward,0.4975467289719626,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL* -MN692145,tat_exon2,8364,8460,forward,0.4866666666666659,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH** -MN692145,rev_exon2,8365,8641,forward,0.2637362637362637,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE* -MN692145,nef,8784,9576,forward,0.3878048780487735,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*HRAFYKGLSAGDFPGEAWPGRGRGVASPQMLHISSCFCLYWVSLVRPDLSLGALWLTREPTA* -MN090335,gag,315,1665,forward,0.8911999999999998,MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ,MYTIEGGYCII**SKFF*SCLKGWL*LFQYLFTAS*CF*QARINCESF*FPACPYYMF*SIFFLSPWP*PNFLPSI*FSPAQY*RSRTHLSPSSLR*SKMAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ* -MN090335,pol,1427,4469,forward,0.2169491525423728,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED* -MN090335,vif,4413,5001,forward,0.34375,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH*SF* -MN090335,vpr,4931,5225,forward,0.5192307692307698,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*T -MN090335,tat_exon1,5202,5418,forward,0.45833333333333326,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ -MN090335,rev_exon1,5341,5419,forward,0.6923076923076923,MAGRSGDRDEDLLKTVRLIKFLYQSS,MAGRSGDRDEDLLKTVRLIKFLYQSS -MN090335,vpu,5433,5682,forward,0.6560975609756099,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL* -MN090335,env,5596,8158,forward,0.6022196261682247,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ* -MN090335,tat_exon2,7739,7835,forward,0.3999999999999999,RPSSQPRGDQTGPKE,RPSSQPRGDQTGPKE*KKKVERETEADPED** -MN090335,rev_exon2,7740,8016,forward,0.46153846153846145,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE* -MN090335,nef,8159,8819,forward,0.5260162601625942,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*H* +seqid,name,start,end,subtype_start,subtype_end,orientation,distance,protein,aminoacids,nucleotides +KX505501.1,env,0,1824,6224,8795,forward,1.9898364485981306,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,gag,336,1824,789,2292,forward,0.3622000000000025,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,vif,1306,1927,5040,5619,forward,2.1463541666666663,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,ATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA +KX505501.1,nef,1306,1927,8796,9417,forward,2.1430894308943085,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,ATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA +KX505501.1,pol,1628,1748,2084,5096,forward,2.1349950149551358,FCRENLAFPQGKAGEFPSEQTRANSPTSRELQVWGRDTN,FCRENLAFPQGKAGEFPSEQTRANSPTSRELQVWGRDTN*,TTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAG +KX505501.1,tat_exon2,1746,1824,8376,8469,forward,2.12,RCIRSTTRTADTELFTRDFPLGTFQ,RCIRSTTRTADTELFTRDFPLGTFQ*,AGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,vpu,1747,1927,6061,6310,forward,2.098780487804878,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA +KX505501.1,rev_exon2,1747,1927,8377,8653,forward,1.9802197802197803,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA +KX505501.1,vpr,1748,1751,5558,5850,forward,2.1884615384615382,M,M,ATG +KX505501.1,tat_exon1,1748,1751,5830,6045,forward,2.1875,M,M,ATG +KX505501.1,rev_exon1,1748,1751,5969,6045,forward,2.1653846153846152,M,M,ATG +MN691959,gag,639,2142,789,2292,forward,0.05400000000000005,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATCGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGAGAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGACACAGCAACCAGATCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAGTGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCYWYCTWTCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAAGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCWGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGAGTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MN691959,pol,1934,4946,2084,5096,forward,0.03589232303090717,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAGCTGAGACAACATCTGTTGAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAGAGCATTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGTATAGTAATATGGGGAAAGACTCCTAGATTTAAACTACCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCTTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGGTATGTTACTAACAAAGGAAGACAAAAGGTTGTCCCCCTAACTAACACAACAAATCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATCAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAATACTATTTTTAGATGGAATAGATAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATATTTTCTTTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN691959,vif,4890,5469,5040,5619,forward,0.0625,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAGGGGATGGTTTTATAGACATCACTATGAAAGAACTCATCCAAGAATAAGTTCAGAAGTATACATCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTACTTTGACTGTTTTTCAGACTCTGCTATAAGAAAGGCCTTATTAGGACATATAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAG +MN691959,vpr,5408,5702,5558,5850,forward,0.21153846153845945,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*T,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCAACAGAAGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACT +MN691959,tat_exon1,5679,5895,5830,6045,forward,0.29166666666666674,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAG +MN691959,rev_exon1,5818,5896,5969,6045,forward,0.5769230769230769,MAGRSGDSDEDLLKTVRLIKFLYQSS,MAGRSGDSDEDLLKTVRLIKFLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGT +MN691959,vpu,5910,6156,6061,6310,forward,0.7060975609756097,SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL,MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL*,ATGCAACCTATACAAATAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGATCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG +MN691959,env,6070,8683,6224,8795,forward,0.0867990654205606,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*DGWQVVKK*,ATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATGCAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGGGGAATGCTACTAATACCAATAGTAGTAATACCAATAGTAGTAGCGGGGAAATGATGATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAAATAAGGTGCAGAAAGAATATGCATTCTTTTATAAACTTGATATAGTACCAATAGATAATGATACTACCAGCTATACGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGATGTAGTAATTAGATCTGCCAATTTCACAGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGCCACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACACTCCCATGCAGAATAAAACAATTTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGCGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAACAACAATGGGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATAACATGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTATAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAAGATGGGTGGCAAGTGGTCAAAAAGTAG +MN691959,tat_exon2,8237,8333,8376,8469,forward,0.19999999999999996,RPTSQTRGDPTGPKE,RPTSQTRGDPTGPKE*KKKVERETETDPFD**,AGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGA +MN691959,rev_exon2,8238,8514,8377,8653,forward,0.16483516483516492,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE*,GACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAG +MN691959,nef,8657,9278,8796,9417,forward,0.16991869918698432,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA +MN692074,env,2,4115,6224,8795,forward,1.9582943925233647,MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,gag,789,2292,789,2292,forward,0.13880000000000003,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MN692074,pol,2084,4115,2084,5096,forward,0.7912263210369039,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,vif,3617,4115,5040,5619,forward,1.9968750000000002,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,vpr,3617,4085,5558,5850,forward,1.9602564102564104,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDT,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDT,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACC +MN692074,nef,3617,4115,8796,9417,forward,1.965040650406504,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,tat_exon1,3823,4084,5830,6045,forward,2.0305555555555554,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC +MN692074,rev_exon1,3823,4084,5969,6045,forward,2.0153846153846153,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC +MN692074,vpu,4080,4164,6061,6310,forward,2.09390243902439,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA +MN692074,tat_exon2,4080,4164,8376,8469,forward,2.1133333333333333,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA +MN692074,rev_exon2,4080,4164,8377,8653,forward,2.065934065934066,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA +MN692145,gag,775,2287,789,2292,forward,0.15900000000000003,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*R*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGAACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGGACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGATAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACACAGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAATGGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAAAACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAG +MN692145,pol,2070,5085,2084,5096,forward,0.10618145563310066,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGGACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATACCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATCAAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACTGGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN692145,vif,5029,5608,5040,5619,forward,0.21875,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTATGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGACCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCATATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCCTAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAG +MN692145,vpr,5547,5841,5558,5850,forward,0.44358974358974423,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*T,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAGACT +MN692145,tat_exon1,5818,6037,5830,6045,forward,0.29166666666666674,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA +MN692145,rev_exon1,5957,6038,5969,6045,forward,0.5192307692307692,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN692145,vpu,6049,6298,6061,6310,forward,0.5804878048780489,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*,ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG +MN692145,env,6212,8783,6224,8795,forward,0.4975467289719626,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA +MN692145,tat_exon2,8364,8460,8376,8469,forward,0.4866666666666659,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +MN692145,rev_exon2,8365,8641,8377,8653,forward,0.2637362637362637,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG +MN692145,nef,8784,9576,8796,9417,forward,0.3878048780487735,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*HRAFYKGLSAGDFPGEAWPGRGRGVASPQMLHISSCFCLYWVSLVRPDLSLGALWLTREPTA*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAA +MN090335,gag,315,1665,789,2292,forward,0.8911999999999998,MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ,MYTIEGGYCII**SKFF*SCLKGWL*LFQYLFTAS*CF*QARINCESF*FPACPYYMF*SIFFLSPWP*PNFLPSI*FSPAQY*RSRTHLSPSSLR*SKMAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ*,ATGTACACAATAGAGGGTGGCTACTGTATTATATAATGATCTAAGTTCTTCTGATCCTGTCTGAAGGGATGGTTGTAGCTGTTCCAATATCTGTTTACAGCCTCCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGTTCCCTGCTTGCCCATACTATATGTTTTAATCTATATTTTTTCTTTCCCCCTGGCCTTAACCGAATTTTCTCCCATCTATCTAATTCTCCCCCGCTCAATACTGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGTCAAAAATGGCGTACTCACCAGTCGCCGCCCCTCGCCTCTTGCCGTGCGCGCTTCAGCAAGCCACCCCACAAGATTTGAACACTATGCTAAACACAGTGGGTGGACACCAAGCAGCTATGCAAATGTTAAAAGAGGTCATCAATGAGGAAGCTGCAGAATGGGATAGATTACATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATTCTGGGACTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAGCAAGGGCCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTTTAAGAGCCGAGCAAGCTACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAATCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGCAACAGGTACAGCCAACATACTGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGCCTGTTAAATGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAGGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAA +MN090335,pol,1427,4469,2084,5096,forward,0.2169491525423728,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAGGACATAGATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAATATGAACAGGTACCCATAGAAATTAGCGGACACAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGCACTCTAAATTTTCCCATCAGCCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGACGGCCCAAAGGTTAAACAATGGCCATTAACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTGTTTGCCATAAAGAAAAAAGATGGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGAATTCTGGGAAATTCAATTAGGTATACCACATCCTGCAGGGCTAAAAAAGAAAAAATCAGTCACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTATAATGTGCTTCCACAAGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAGATCCTGGAGCCTTTTAGAAAGACAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAACATAGAACAAAAGTAGAGGAACTGAGGCAACATCTGATGAGGTGGGGATTTACCACACCAGACAAAAAGCACCAGAAAGAACCCCCATTCCTTTGGATGGGGTATGAACTCCATCCTAATAAATGGACAGTACAGCCTATAGTACTGCCAGAAAAGGAAAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTGAAGCAATTATGTAAGCTCCTTAGGGGAACCAAAGCATTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGATCCGGTACATGGAGCATATTATGACCCAGCAAAGGACTTAATAGCAGAACTACAGAAGCAGGGAGAAGGTCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCATACTAATGATGTAAAGCAATTAACAGAGGCAGTGCAAAAAATATCCACAGAAAGTATAGTAATATGGGGAAGGACTCCTAAATTTAGATTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGATTATTGGCAAGCCACCTGGATCCCTGAGTGGGAGTTTGTCAACACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAATAGGGATAATAAATCAGGAAAAGCAGGATATGTTACTGATAGAGGAAGACAAAAGGTTGTCACCATAAATGACACAACAAATCAGAAAACTGAATTACAAGCCATTCATCTAGCCTTGCAGGATTCGGGGCTAGAAGTAAACATAGTAACAGACTCACAGTATGCATTAGGGATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTAATAAAAAAGGAAAAGGTCTACCTGGCATGGGTGCCAGCCCACAAAGGAATTGGAGGAAATGAACAGGTAGATAAACTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGAAAAAGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAACAATGGCTAGTGATTTTAACCTACCACCTATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGGCAAGTAGACTGTAGTCCAGGTATATGGCAGCTAGATTGTACACATTTAGAAGAAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTGATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTATTTTAAAACTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCCGCAATTTCACCAGTAATACAGTGAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGTATTCCCTACAATCCCCAGAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGATACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCCAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN090335,vif,4413,5001,5040,5619,forward,0.34375,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH*SF*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAAAAATGGGCTTATAGACACCATTACGAAACCACTCATCCAAGAATAAGTTCAGAAGTACATATCCCACTAGGGGATGATAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAGAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAACAGCAGTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAG +MN090335,vpr,4931,5225,5558,5850,forward,0.5192307692307698,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*T,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAGACCTAGGACAATATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATGGAGCCAGTAGATCATAGACT +MN090335,tat_exon1,5202,5418,5830,6045,forward,0.45833333333333326,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAG +MN090335,rev_exon1,5341,5419,5969,6045,forward,0.6923076923076923,MAGRSGDRDEDLLKTVRLIKFLYQSS,MAGRSGDRDEDLLKTVRLIKFLYQSS,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGT +MN090335,vpu,5433,5682,6061,6310,forward,0.6560975609756099,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL*,ATGCAATCTTTAGAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTAGGCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAAAATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG +MN090335,env,5596,8158,6224,8795,forward,0.6022196261682247,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*,ATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTGGACCAGATGCATGAGGATATAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAGAAATGATACTGTAGGAAATCAAACAAATCTCACTGAAACTAATACAATACAGGGAAGAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAACATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAGGGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTGGTTTTGCAATTCTAAAGTGTAAGGATGAGATGTTCAATGGAACAGGACCATGTAAGAATGTCAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTGTCAACTCAACTACTGTTAAATGGTAGCCTAGCAGAAAAAGAGATAGTACTTAGATCTGAAAATTTCACAGACAATGGTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAGGGAGAGCAATTTATGCAACAGGGCAGATAATAGGAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGGAATGACACTTTAAGCAAAATAGTTGAAAAATTAAGGGAAAAATTTGGAAAAGATAAAACAATAATCTTTAATCAATCATCAGGAGGGGACATGGAAATTGAAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGGAGTGTTAATGGAACTAGCATAAACGGAACTAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATAAACAGGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCTATCAGTGGGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATGGTGGTACAAATAATAGTACAGAGGAGACGGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAAGGCACAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAGCGTTAGGAGCTATGTTCCTCGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCACTGACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGCAATAAATCTTACGATACCATCTGGGATAACATGACCTGGATGCAGTGGGACAGAGAAATTCAAAATTACACAGGGAAAATATACAACTTACTTGAGGAATCGCAAATCCAACAGGAAAAGAATGAAAAGGAATTATTAGAACTAGATCAATGGGCAAATTTGTGGAATTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAGGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAGGGAACAGATAGGGTTATAGAGGTAGGACAAAGAATTGGCAGAGCTTTTCTCCACATACCTAGAAGGATAAGACAGGGATTAGAAAGGGCTTTGCAATAA +MN090335,tat_exon2,7739,7835,8376,8469,forward,0.3999999999999999,RPSSQPRGDQTGPKE,RPSSQPRGDQTGPKE*KKKVERETEADPED**,AGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGA +MN090335,rev_exon2,7740,8016,8377,8653,forward,0.46153846153846145,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE*,GACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAG +MN090335,nef,8159,8819,8796,9417,forward,0.5260162601625942,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*H*,ATGGGTGGCAAGTGGTCAAAAGGTTGTATGGCTGGATGGCCTACTGTAAGGGAAAGAATGGAAAGAATTGATCCAAGGCCTGCTGCAAGGAGGGAACAAGCTGAGCCAGCAGCAGCTGGGGTAGGAGCAGCATCTCGAGACTTGGAAAAATATGGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAAGTAGGCTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTGGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGACACTGA diff --git a/tests/expected-results-small/orfs.json b/tests/expected-results-small/orfs.json index 5cdefb5..ad5aae9 100644 --- a/tests/expected-results-small/orfs.json +++ b/tests/expected-results-small/orfs.json @@ -2,9 +2,11 @@ "KX505501.1": [ { "name": "env", - "orientation": "forward", "start": 0, "end": 1824, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 1.9898364485981306, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", "aminoacids": "GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*", @@ -12,9 +14,11 @@ }, { "name": "gag", - "orientation": "forward", "start": 336, "end": 1824, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.3622000000000025, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", "aminoacids": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*", @@ -22,9 +26,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 1306, "end": 1927, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 2.1463541666666663, "protein": "MRTQIVKLF", "aminoacids": "MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*", @@ -32,9 +38,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 1306, "end": 1927, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 2.1430894308943085, "protein": "MRTQIVKLF", "aminoacids": "MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*", @@ -42,9 +50,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1628, "end": 1748, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 2.1349950149551358, "protein": "FCRENLAFPQGKAGEFPSEQTRANSPTSRELQVWGRDTN", "aminoacids": "FCRENLAFPQGKAGEFPSEQTRANSPTSRELQVWGRDTN*", @@ -52,9 +62,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 1746, "end": 1824, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 2.12, "protein": "RCIRSTTRTADTELFTRDFPLGTFQ", "aminoacids": "RCIRSTTRTADTELFTRDFPLGTFQ*", @@ -62,9 +74,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 1747, "end": 1927, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 2.098780487804878, "protein": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI", "aminoacids": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*", @@ -72,9 +86,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 1747, "end": 1927, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 1.9802197802197803, "protein": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI", "aminoacids": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*", @@ -82,9 +98,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 1748, "end": 1751, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 2.1884615384615382, "protein": "M", "aminoacids": "M", @@ -92,9 +110,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 1748, "end": 1751, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 2.1875, "protein": "M", "aminoacids": "M", @@ -102,9 +122,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 1748, "end": 1751, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 2.1653846153846152, "protein": "M", "aminoacids": "M", @@ -114,9 +136,11 @@ "MN691959": [ { "name": "gag", - "orientation": "forward", "start": 639, "end": 2142, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.05400000000000005, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ", "aminoacids": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ*", @@ -124,9 +148,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1934, "end": 4946, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.03589232303090717, "protein": "FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -134,9 +160,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4890, "end": 5469, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.0625, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*", @@ -144,9 +172,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5408, "end": 5702, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.21153846153845945, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS", "aminoacids": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*T", @@ -154,9 +184,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5679, "end": 5895, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ", "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ", @@ -164,9 +196,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5818, "end": 5896, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5769230769230769, "protein": "MAGRSGDSDEDLLKTVRLIKFLYQSS", "aminoacids": "MAGRSGDSDEDLLKTVRLIKFLYQSS", @@ -174,9 +208,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5910, "end": 6156, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.7060975609756097, "protein": "SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL", "aminoacids": "MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL*", @@ -184,9 +220,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6070, "end": 8683, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.0867990654205606, "protein": "MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL", "aminoacids": "MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*DGWQVVKK*", @@ -194,9 +232,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8237, "end": 8333, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.19999999999999996, "protein": "RPTSQTRGDPTGPKE", "aminoacids": "RPTSQTRGDPTGPKE*KKKVERETETDPFD**", @@ -204,9 +244,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8238, "end": 8514, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.16483516483516492, "protein": "DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE", "aminoacids": "DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE*", @@ -214,9 +256,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8657, "end": 9278, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.16991869918698432, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", "aminoacids": "MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*", @@ -226,9 +270,11 @@ "MN692074": [ { "name": "env", - "orientation": "forward", "start": 2, "end": 4115, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 1.9582943925233647, "protein": "MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", "aminoacids": "EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", @@ -236,9 +282,11 @@ }, { "name": "gag", - "orientation": "forward", "start": 789, "end": 2292, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.13880000000000003, "protein": "MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ", "aminoacids": "MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*", @@ -246,9 +294,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2084, "end": 4115, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.7912263210369039, "protein": "FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", "aminoacids": "FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", @@ -256,9 +306,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 3617, "end": 4115, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 1.9968750000000002, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", "aminoacids": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", @@ -266,9 +318,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 3617, "end": 4085, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 1.9602564102564104, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDT", "aminoacids": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDT", @@ -276,9 +330,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 3617, "end": 4115, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 1.965040650406504, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", "aminoacids": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*", @@ -286,9 +342,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 3823, "end": 4084, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 2.0305555555555554, "protein": "MVPVRERTHSRSRNLLCRWGS", "aminoacids": "MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY", @@ -296,9 +354,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 3823, "end": 4084, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 2.0153846153846153, "protein": "MVPVRERTHSRSRNLLCRWGS", "aminoacids": "MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY", @@ -306,9 +366,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 4080, "end": 4164, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 2.09390243902439, "protein": "IPSGEPSDAAYKQLLFACTGSLWLDQI", "aminoacids": "IPSGEPSDAAYKQLLFACTGSLWLDQI*", @@ -316,9 +378,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 4080, "end": 4164, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 2.1133333333333333, "protein": "IPSGEPSDAAYKQLLFACTGSLWLDQI", "aminoacids": "IPSGEPSDAAYKQLLFACTGSLWLDQI*", @@ -326,9 +390,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 4080, "end": 4164, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 2.065934065934066, "protein": "IPSGEPSDAAYKQLLFACTGSLWLDQI", "aminoacids": "IPSGEPSDAAYKQLLFACTGSLWLDQI*", @@ -338,9 +404,11 @@ "MN692145": [ { "name": "gag", - "orientation": "forward", "start": 775, "end": 2287, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.15900000000000003, "protein": "MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ", "aminoacids": "MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*R*", @@ -348,9 +416,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 2070, "end": 5085, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.10618145563310066, "protein": "FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*", @@ -358,9 +428,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 5029, "end": 5608, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.21875, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*", @@ -368,9 +440,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 5547, "end": 5841, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.44358974358974423, "protein": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS", "aminoacids": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*T", @@ -378,9 +452,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5818, "end": 6037, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.29166666666666674, "protein": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ", "aminoacids": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*", @@ -388,9 +464,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5957, "end": 6038, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.5192307692307692, "protein": "MAGRSGDSDEELLKTVRLIKFLYQSSK", "aminoacids": "MAGRSGDSDEELLKTVRLIKFLYQSSK", @@ -398,9 +476,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 6049, "end": 6298, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.5804878048780489, "protein": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL", "aminoacids": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*", @@ -408,9 +488,11 @@ }, { "name": "env", - "orientation": "forward", "start": 6212, "end": 8783, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.4975467289719626, "protein": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL", "aminoacids": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*", @@ -418,9 +500,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 8364, "end": 8460, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.4866666666666659, "protein": "RPASQPRGDPTGPKESKKKVERETETDPLH", "aminoacids": "RPASQPRGDPTGPKESKKKVERETETDPLH**", @@ -428,9 +512,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 8365, "end": 8641, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.2637362637362637, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE", "aminoacids": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*", @@ -438,9 +524,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8784, "end": 9576, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.3878048780487735, "protein": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC", "aminoacids": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*HRAFYKGLSAGDFPGEAWPGRGRGVASPQMLHISSCFCLYWVSLVRPDLSLGALWLTREPTA*", @@ -450,9 +538,11 @@ "MN090335": [ { "name": "gag", - "orientation": "forward", "start": 315, "end": 1665, + "subtype_start": 789, + "subtype_end": 2292, + "orientation": "forward", "distance": 0.8911999999999998, "protein": "MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ", "aminoacids": "MYTIEGGYCII**SKFF*SCLKGWL*LFQYLFTAS*CF*QARINCESF*FPACPYYMF*SIFFLSPWP*PNFLPSI*FSPAQY*RSRTHLSPSSLR*SKMAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ*", @@ -460,9 +550,11 @@ }, { "name": "pol", - "orientation": "forward", "start": 1427, "end": 4469, + "subtype_start": 2084, + "subtype_end": 5096, + "orientation": "forward", "distance": 0.2169491525423728, "protein": "FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", "aminoacids": "FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*", @@ -470,9 +562,11 @@ }, { "name": "vif", - "orientation": "forward", "start": 4413, "end": 5001, + "subtype_start": 5040, + "subtype_end": 5619, + "orientation": "forward", "distance": 0.34375, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH", "aminoacids": "MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH*SF*", @@ -480,9 +574,11 @@ }, { "name": "vpr", - "orientation": "forward", "start": 4931, "end": 5225, + "subtype_start": 5558, + "subtype_end": 5850, + "orientation": "forward", "distance": 0.5192307692307698, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS", "aminoacids": "MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*T", @@ -490,9 +586,11 @@ }, { "name": "tat_exon1", - "orientation": "forward", "start": 5202, "end": 5418, + "subtype_start": 5830, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.45833333333333326, "protein": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", "aminoacids": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", @@ -500,9 +598,11 @@ }, { "name": "rev_exon1", - "orientation": "forward", "start": 5341, "end": 5419, + "subtype_start": 5969, + "subtype_end": 6045, + "orientation": "forward", "distance": 0.6923076923076923, "protein": "MAGRSGDRDEDLLKTVRLIKFLYQSS", "aminoacids": "MAGRSGDRDEDLLKTVRLIKFLYQSS", @@ -510,9 +610,11 @@ }, { "name": "vpu", - "orientation": "forward", "start": 5433, "end": 5682, + "subtype_start": 6061, + "subtype_end": 6310, + "orientation": "forward", "distance": 0.6560975609756099, "protein": "MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL", "aminoacids": "MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL*", @@ -520,9 +622,11 @@ }, { "name": "env", - "orientation": "forward", "start": 5596, "end": 8158, + "subtype_start": 6224, + "subtype_end": 8795, + "orientation": "forward", "distance": 0.6022196261682247, "protein": "MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ", "aminoacids": "MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*", @@ -530,9 +634,11 @@ }, { "name": "tat_exon2", - "orientation": "forward", "start": 7739, "end": 7835, + "subtype_start": 8376, + "subtype_end": 8469, + "orientation": "forward", "distance": 0.3999999999999999, "protein": "RPSSQPRGDQTGPKE", "aminoacids": "RPSSQPRGDQTGPKE*KKKVERETEADPED**", @@ -540,9 +646,11 @@ }, { "name": "rev_exon2", - "orientation": "forward", "start": 7740, "end": 8016, + "subtype_start": 8377, + "subtype_end": 8653, + "orientation": "forward", "distance": 0.46153846153846145, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE", "aminoacids": "DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE*", @@ -550,9 +658,11 @@ }, { "name": "nef", - "orientation": "forward", "start": 8159, "end": 8819, + "subtype_start": 8796, + "subtype_end": 9417, + "orientation": "forward", "distance": 0.5260162601625942, "protein": "MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC", "aminoacids": "MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*H*",