diff --git a/intact/intact.py b/intact/intact.py index 332cf19..3c7b6c2 100644 --- a/intact/intact.py +++ b/intact/intact.py @@ -824,7 +824,7 @@ def analyse_single_sequence(writer, sequence, blast_rows): o.distance, str(o.query.protein), str(o.query.aminoacids), - str(sequence[o.query.start:o.query.end].seq), + str(o.query.nucleotides), ) for o in sorted(sequence_orfs + sequence_small_orfs, key=lambda o: o.query.start)] if include_packaging_signal: diff --git a/tests/expected-results-edgy/errors.json b/tests/expected-results-edgy/errors.json index 7fcad74..ff94b05 100644 --- a/tests/expected-results-edgy/errors.json +++ b/tests/expected-results-edgy/errors.json @@ -4,57 +4,57 @@ { "sequence_name": "small-sequence[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "ORF gag at 1-1498 can have maximum deletions 30, got 1494" + "message": "ORF gag at 1-1497 can have maximum deletions 30, got 1494" }, { "sequence_name": "small-sequence[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "ORF pol at 1290-4302 can have maximum deletions 30, got 2988" + "message": "ORF pol at 1290-4301 can have maximum deletions 30, got 2988" }, { "sequence_name": "small-sequence[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "ORF env at 5430-8007 can have maximum deletions 100, got 2574" + "message": "ORF env at 5430-8006 can have maximum deletions 100, got 2574" }, { "sequence_name": "small-sequence[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "Smaller ORF vif at 4246-4822 can have maximum deletions 30, got 573" + "message": "Smaller ORF vif at 4246-4821 can have maximum deletions 30, got 573" }, { "sequence_name": "small-sequence[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "Smaller ORF vpr at 4764-5052 can have maximum deletions 30, got 285" + "message": "Smaller ORF vpr at 4764-5051 can have maximum deletions 30, got 285" }, { "sequence_name": "small-sequence[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon1 at 5032-5248 can have maximum deletions 30, got 216" + "message": "Smaller ORF tat_exon1 at 5032-5247 can have maximum deletions 30, got 216" }, { "sequence_name": "small-sequence[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon1 at 5171-5249 can have maximum deletions 30, got 78" + "message": "Smaller ORF rev_exon1 at 5171-5248 can have maximum deletions 30, got 78" }, { "sequence_name": "small-sequence[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "Smaller ORF vpu at 5267-5513 can have maximum deletions 30, got 243" + "message": "Smaller ORF vpu at 5267-5512 can have maximum deletions 30, got 243" }, { "sequence_name": "small-sequence[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon2 at 7567-7663 can have maximum deletions 30, got 90" + "message": "Smaller ORF tat_exon2 at 7567-7662 can have maximum deletions 30, got 90" }, { "sequence_name": "small-sequence[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 7568-7865 can have maximum deletions 30, got 294" + "message": "Smaller ORF rev_exon2 at 7568-7864 can have maximum deletions 30, got 294" }, { "sequence_name": "small-sequence[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8008-8683 can have maximum deletions 30, got 672" + "message": "Smaller ORF nef at 8008-8682 can have maximum deletions 30, got 672" }, { "sequence_name": "small-sequence[REVERSE_COMPLEMENT]", @@ -86,57 +86,57 @@ { "sequence_name": "singleton-sequence", "error": "DeletionInOrf", - "message": "ORF gag at 1-1498 can have maximum deletions 30, got 1494" + "message": "ORF gag at 1-1497 can have maximum deletions 30, got 1494" }, { "sequence_name": "singleton-sequence", "error": "DeletionInOrf", - "message": "ORF pol at 1290-4302 can have maximum deletions 30, got 3006" + "message": "ORF pol at 1290-4301 can have maximum deletions 30, got 3006" }, { "sequence_name": "singleton-sequence", "error": "DeletionInOrf", - "message": "ORF env at 5430-8007 can have maximum deletions 100, got 2574" + "message": "ORF env at 5430-8006 can have maximum deletions 100, got 2574" }, { "sequence_name": "singleton-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF vif at 4246-4822 can have maximum deletions 30, got 573" + "message": "Smaller ORF vif at 4246-4821 can have maximum deletions 30, got 573" }, { "sequence_name": "singleton-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF vpr at 4764-5052 can have maximum deletions 30, got 285" + "message": "Smaller ORF vpr at 4764-5051 can have maximum deletions 30, got 285" }, { "sequence_name": "singleton-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon1 at 5032-5248 can have maximum deletions 30, got 216" + "message": "Smaller ORF tat_exon1 at 5032-5247 can have maximum deletions 30, got 216" }, { "sequence_name": "singleton-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon1 at 5171-5249 can have maximum deletions 30, got 78" + "message": "Smaller ORF rev_exon1 at 5171-5248 can have maximum deletions 30, got 78" }, { "sequence_name": "singleton-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF vpu at 5267-5513 can have maximum deletions 30, got 243" + "message": "Smaller ORF vpu at 5267-5512 can have maximum deletions 30, got 243" }, { "sequence_name": "singleton-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon2 at 7567-7663 can have maximum deletions 30, got 90" + "message": "Smaller ORF tat_exon2 at 7567-7662 can have maximum deletions 30, got 90" }, { "sequence_name": "singleton-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 7568-7865 can have maximum deletions 30, got 294" + "message": "Smaller ORF rev_exon2 at 7568-7864 can have maximum deletions 30, got 294" }, { "sequence_name": "singleton-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8008-8683 can have maximum deletions 30, got 672" + "message": "Smaller ORF nef at 8008-8682 can have maximum deletions 30, got 672" }, { "sequence_name": "singleton-sequence", @@ -168,57 +168,57 @@ { "sequence_name": "empty-sequence", "error": "DeletionInOrf", - "message": "ORF gag at 1-1498 can have maximum deletions 30, got 1494" + "message": "ORF gag at 1-1497 can have maximum deletions 30, got 1494" }, { "sequence_name": "empty-sequence", "error": "DeletionInOrf", - "message": "ORF pol at 1290-4302 can have maximum deletions 30, got 3009" + "message": "ORF pol at 1290-4301 can have maximum deletions 30, got 3009" }, { "sequence_name": "empty-sequence", "error": "DeletionInOrf", - "message": "ORF env at 5430-8007 can have maximum deletions 100, got 2574" + "message": "ORF env at 5430-8006 can have maximum deletions 100, got 2574" }, { "sequence_name": "empty-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF vif at 4246-4822 can have maximum deletions 30, got 573" + "message": "Smaller ORF vif at 4246-4821 can have maximum deletions 30, got 573" }, { "sequence_name": "empty-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF vpr at 4764-5052 can have maximum deletions 30, got 285" + "message": "Smaller ORF vpr at 4764-5051 can have maximum deletions 30, got 285" }, { "sequence_name": "empty-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon1 at 5032-5248 can have maximum deletions 30, got 216" + "message": "Smaller ORF tat_exon1 at 5032-5247 can have maximum deletions 30, got 216" }, { "sequence_name": "empty-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon1 at 5171-5249 can have maximum deletions 30, got 78" + "message": "Smaller ORF rev_exon1 at 5171-5248 can have maximum deletions 30, got 78" }, { "sequence_name": "empty-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF vpu at 5267-5513 can have maximum deletions 30, got 243" + "message": "Smaller ORF vpu at 5267-5512 can have maximum deletions 30, got 243" }, { "sequence_name": "empty-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon2 at 7567-7663 can have maximum deletions 30, got 90" + "message": "Smaller ORF tat_exon2 at 7567-7662 can have maximum deletions 30, got 90" }, { "sequence_name": "empty-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 7568-7865 can have maximum deletions 30, got 294" + "message": "Smaller ORF rev_exon2 at 7568-7864 can have maximum deletions 30, got 294" }, { "sequence_name": "empty-sequence", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8008-8683 can have maximum deletions 30, got 672" + "message": "Smaller ORF nef at 8008-8682 can have maximum deletions 30, got 672" }, { "sequence_name": "empty-sequence", @@ -245,57 +245,57 @@ { "sequence_name": "empty-sequence2", "error": "DeletionInOrf", - "message": "ORF gag at 1-1498 can have maximum deletions 30, got 1494" + "message": "ORF gag at 1-1497 can have maximum deletions 30, got 1494" }, { "sequence_name": "empty-sequence2", "error": "DeletionInOrf", - "message": "ORF pol at 1290-4302 can have maximum deletions 30, got 3009" + "message": "ORF pol at 1290-4301 can have maximum deletions 30, got 3009" }, { "sequence_name": "empty-sequence2", "error": "DeletionInOrf", - "message": "ORF env at 5430-8007 can have maximum deletions 100, got 2574" + "message": "ORF env at 5430-8006 can have maximum deletions 100, got 2574" }, { "sequence_name": "empty-sequence2", "error": "DeletionInOrf", - "message": "Smaller ORF vif at 4246-4822 can have maximum deletions 30, got 573" + "message": "Smaller ORF vif at 4246-4821 can have maximum deletions 30, got 573" }, { "sequence_name": "empty-sequence2", "error": "DeletionInOrf", - "message": "Smaller ORF vpr at 4764-5052 can have maximum deletions 30, got 285" + "message": "Smaller ORF vpr at 4764-5051 can have maximum deletions 30, got 285" }, { "sequence_name": "empty-sequence2", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon1 at 5032-5248 can have maximum deletions 30, got 216" + "message": "Smaller ORF tat_exon1 at 5032-5247 can have maximum deletions 30, got 216" }, { "sequence_name": "empty-sequence2", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon1 at 5171-5249 can have maximum deletions 30, got 78" + "message": "Smaller ORF rev_exon1 at 5171-5248 can have maximum deletions 30, got 78" }, { "sequence_name": "empty-sequence2", "error": "DeletionInOrf", - "message": "Smaller ORF vpu at 5267-5513 can have maximum deletions 30, got 243" + "message": "Smaller ORF vpu at 5267-5512 can have maximum deletions 30, got 243" }, { "sequence_name": "empty-sequence2", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon2 at 7567-7663 can have maximum deletions 30, got 90" + "message": "Smaller ORF tat_exon2 at 7567-7662 can have maximum deletions 30, got 90" }, { "sequence_name": "empty-sequence2", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 7568-7865 can have maximum deletions 30, got 294" + "message": "Smaller ORF rev_exon2 at 7568-7864 can have maximum deletions 30, got 294" }, { "sequence_name": "empty-sequence2", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8008-8683 can have maximum deletions 30, got 672" + "message": "Smaller ORF nef at 8008-8682 can have maximum deletions 30, got 672" }, { "sequence_name": "empty-sequence2", @@ -322,7 +322,7 @@ { "sequence_name": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8008-8683 can have maximum deletions 30, got 54" + "message": "Smaller ORF nef at 8008-8682 can have maximum deletions 30, got 54" }, { "sequence_name": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED[REVERSE_COMPLEMENT]", @@ -344,7 +344,7 @@ { "sequence_name": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.WITH-XS[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8008-8683 can have maximum deletions 30, got 54" + "message": "Smaller ORF nef at 8008-8682 can have maximum deletions 30, got 54" }, { "sequence_name": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.WITH-XS[REVERSE_COMPLEMENT]", @@ -366,57 +366,57 @@ { "sequence_name": "small-sequence-with-xs", "error": "DeletionInOrf", - "message": "ORF gag at 1-1498 can have maximum deletions 30, got 1494" + "message": "ORF gag at 1-1497 can have maximum deletions 30, got 1494" }, { "sequence_name": "small-sequence-with-xs", "error": "DeletionInOrf", - "message": "ORF pol at 1290-4302 can have maximum deletions 30, got 2997" + "message": "ORF pol at 1290-4301 can have maximum deletions 30, got 2997" }, { "sequence_name": "small-sequence-with-xs", "error": "DeletionInOrf", - "message": "ORF env at 5430-8007 can have maximum deletions 100, got 2574" + "message": "ORF env at 5430-8006 can have maximum deletions 100, got 2574" }, { "sequence_name": "small-sequence-with-xs", "error": "DeletionInOrf", - "message": "Smaller ORF vif at 4246-4822 can have maximum deletions 30, got 573" + "message": "Smaller ORF vif at 4246-4821 can have maximum deletions 30, got 573" }, { "sequence_name": "small-sequence-with-xs", "error": "DeletionInOrf", - "message": "Smaller ORF vpr at 4764-5052 can have maximum deletions 30, got 285" + "message": "Smaller ORF vpr at 4764-5051 can have maximum deletions 30, got 285" }, { "sequence_name": "small-sequence-with-xs", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon1 at 5032-5248 can have maximum deletions 30, got 216" + "message": "Smaller ORF tat_exon1 at 5032-5247 can have maximum deletions 30, got 216" }, { "sequence_name": "small-sequence-with-xs", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon1 at 5171-5249 can have maximum deletions 30, got 78" + "message": "Smaller ORF rev_exon1 at 5171-5248 can have maximum deletions 30, got 78" }, { "sequence_name": "small-sequence-with-xs", "error": "DeletionInOrf", - "message": "Smaller ORF vpu at 5267-5513 can have maximum deletions 30, got 243" + "message": "Smaller ORF vpu at 5267-5512 can have maximum deletions 30, got 243" }, { "sequence_name": "small-sequence-with-xs", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon2 at 7567-7663 can have maximum deletions 30, got 90" + "message": "Smaller ORF tat_exon2 at 7567-7662 can have maximum deletions 30, got 90" }, { "sequence_name": "small-sequence-with-xs", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 7568-7865 can have maximum deletions 30, got 294" + "message": "Smaller ORF rev_exon2 at 7568-7864 can have maximum deletions 30, got 294" }, { "sequence_name": "small-sequence-with-xs", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8008-8683 can have maximum deletions 30, got 672" + "message": "Smaller ORF nef at 8008-8682 can have maximum deletions 30, got 672" }, { "sequence_name": "small-sequence-with-xs", @@ -453,7 +453,7 @@ { "sequence_name": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.WITH-BAD-SYMBOLS[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8008-8683 can have maximum deletions 30, got 54" + "message": "Smaller ORF nef at 8008-8682 can have maximum deletions 30, got 54" }, { "sequence_name": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.WITH-BAD-SYMBOLS[REVERSE_COMPLEMENT]", @@ -475,57 +475,57 @@ { "sequence_name": "small-sequence-with-bad-symbols", "error": "DeletionInOrf", - "message": "ORF gag at 1-1498 can have maximum deletions 30, got 1494" + "message": "ORF gag at 1-1497 can have maximum deletions 30, got 1494" }, { "sequence_name": "small-sequence-with-bad-symbols", "error": "DeletionInOrf", - "message": "ORF pol at 1290-4302 can have maximum deletions 30, got 2997" + "message": "ORF pol at 1290-4301 can have maximum deletions 30, got 2997" }, { "sequence_name": "small-sequence-with-bad-symbols", "error": "DeletionInOrf", - "message": "ORF env at 5430-8007 can have maximum deletions 100, got 2574" + "message": "ORF env at 5430-8006 can have maximum deletions 100, got 2574" }, { "sequence_name": "small-sequence-with-bad-symbols", "error": "DeletionInOrf", - "message": "Smaller ORF vif at 4246-4822 can have maximum deletions 30, got 573" + "message": "Smaller ORF vif at 4246-4821 can have maximum deletions 30, got 573" }, { "sequence_name": "small-sequence-with-bad-symbols", "error": "DeletionInOrf", - "message": "Smaller ORF vpr at 4764-5052 can have maximum deletions 30, got 285" + "message": "Smaller ORF vpr at 4764-5051 can have maximum deletions 30, got 285" }, { "sequence_name": "small-sequence-with-bad-symbols", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon1 at 5032-5248 can have maximum deletions 30, got 216" + "message": "Smaller ORF tat_exon1 at 5032-5247 can have maximum deletions 30, got 216" }, { "sequence_name": "small-sequence-with-bad-symbols", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon1 at 5171-5249 can have maximum deletions 30, got 78" + "message": "Smaller ORF rev_exon1 at 5171-5248 can have maximum deletions 30, got 78" }, { "sequence_name": "small-sequence-with-bad-symbols", "error": "DeletionInOrf", - "message": "Smaller ORF vpu at 5267-5513 can have maximum deletions 30, got 243" + "message": "Smaller ORF vpu at 5267-5512 can have maximum deletions 30, got 243" }, { "sequence_name": "small-sequence-with-bad-symbols", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon2 at 7567-7663 can have maximum deletions 30, got 90" + "message": "Smaller ORF tat_exon2 at 7567-7662 can have maximum deletions 30, got 90" }, { "sequence_name": "small-sequence-with-bad-symbols", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 7568-7865 can have maximum deletions 30, got 294" + "message": "Smaller ORF rev_exon2 at 7568-7864 can have maximum deletions 30, got 294" }, { "sequence_name": "small-sequence-with-bad-symbols", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8008-8683 can have maximum deletions 30, got 672" + "message": "Smaller ORF nef at 8008-8682 can have maximum deletions 30, got 672" }, { "sequence_name": "small-sequence-with-bad-symbols", @@ -562,7 +562,7 @@ { "sequence_name": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.WITH-DASHES[REVERSE_COMPLEMENT]", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8008-8683 can have maximum deletions 30, got 54" + "message": "Smaller ORF nef at 8008-8682 can have maximum deletions 30, got 54" }, { "sequence_name": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.WITH-DASHES[REVERSE_COMPLEMENT]", @@ -584,57 +584,57 @@ { "sequence_name": "small-sequence-with-dashes", "error": "DeletionInOrf", - "message": "ORF gag at 1-1498 can have maximum deletions 30, got 1494" + "message": "ORF gag at 1-1497 can have maximum deletions 30, got 1494" }, { "sequence_name": "small-sequence-with-dashes", "error": "DeletionInOrf", - "message": "ORF pol at 1290-4302 can have maximum deletions 30, got 2997" + "message": "ORF pol at 1290-4301 can have maximum deletions 30, got 2997" }, { "sequence_name": "small-sequence-with-dashes", "error": "DeletionInOrf", - "message": "ORF env at 5430-8007 can have maximum deletions 100, got 2574" + "message": "ORF env at 5430-8006 can have maximum deletions 100, got 2574" }, { "sequence_name": "small-sequence-with-dashes", "error": "DeletionInOrf", - "message": "Smaller ORF vif at 4246-4822 can have maximum deletions 30, got 573" + "message": "Smaller ORF vif at 4246-4821 can have maximum deletions 30, got 573" }, { "sequence_name": "small-sequence-with-dashes", "error": "DeletionInOrf", - "message": "Smaller ORF vpr at 4764-5052 can have maximum deletions 30, got 285" + "message": "Smaller ORF vpr at 4764-5051 can have maximum deletions 30, got 285" }, { "sequence_name": "small-sequence-with-dashes", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon1 at 5032-5248 can have maximum deletions 30, got 216" + "message": "Smaller ORF tat_exon1 at 5032-5247 can have maximum deletions 30, got 216" }, { "sequence_name": "small-sequence-with-dashes", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon1 at 5171-5249 can have maximum deletions 30, got 78" + "message": "Smaller ORF rev_exon1 at 5171-5248 can have maximum deletions 30, got 78" }, { "sequence_name": "small-sequence-with-dashes", "error": "DeletionInOrf", - "message": "Smaller ORF vpu at 5267-5513 can have maximum deletions 30, got 243" + "message": "Smaller ORF vpu at 5267-5512 can have maximum deletions 30, got 243" }, { "sequence_name": "small-sequence-with-dashes", "error": "DeletionInOrf", - "message": "Smaller ORF tat_exon2 at 7567-7663 can have maximum deletions 30, got 90" + "message": "Smaller ORF tat_exon2 at 7567-7662 can have maximum deletions 30, got 90" }, { "sequence_name": "small-sequence-with-dashes", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 7568-7865 can have maximum deletions 30, got 294" + "message": "Smaller ORF rev_exon2 at 7568-7864 can have maximum deletions 30, got 294" }, { "sequence_name": "small-sequence-with-dashes", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8008-8683 can have maximum deletions 30, got 672" + "message": "Smaller ORF nef at 8008-8682 can have maximum deletions 30, got 672" }, { "sequence_name": "small-sequence-with-dashes", diff --git a/tests/expected-results-edgy/holistic.json b/tests/expected-results-edgy/holistic.json index 8029c4d..ad3e2c4 100644 --- a/tests/expected-results-edgy/holistic.json +++ b/tests/expected-results-edgy/holistic.json @@ -8,7 +8,7 @@ "blast_qseq_coverage": 1.130479522535501, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "small-sequence[REVERSE_COMPLEMENT]": { @@ -20,7 +20,7 @@ "blast_qseq_coverage": 0.0, "blast_sseq_orfs_coverage": 0.0, "orfs_start": 1, - "orfs_end": 8007, + "orfs_end": 8006, "blast_n_conseqs": 0 }, "singleton-sequence": { @@ -32,7 +32,7 @@ "blast_qseq_coverage": 0.0, "blast_sseq_orfs_coverage": 0.0, "orfs_start": 1, - "orfs_end": 8007, + "orfs_end": 8006, "blast_n_conseqs": 0 }, "empty-sequence": { @@ -44,7 +44,7 @@ "blast_qseq_coverage": 0.0, "blast_sseq_orfs_coverage": 0.0, "orfs_start": 1, - "orfs_end": 8007, + "orfs_end": 8006, "blast_n_conseqs": 0 }, "empty-sequence2": { @@ -56,7 +56,7 @@ "blast_qseq_coverage": 0.0, "blast_sseq_orfs_coverage": 0.0, "orfs_start": 1, - "orfs_end": 8007, + "orfs_end": 8006, "blast_n_conseqs": 0 }, "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.REVERSED[REVERSE_COMPLEMENT]": { @@ -68,7 +68,7 @@ "blast_qseq_coverage": 0.0, "blast_sseq_orfs_coverage": 0.0, "orfs_start": 1, - "orfs_end": 8007, + "orfs_end": 8006, "blast_n_conseqs": 0 }, "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.WITH-XS[REVERSE_COMPLEMENT]": { @@ -80,7 +80,7 @@ "blast_qseq_coverage": 0.0, "blast_sseq_orfs_coverage": 0.0, "orfs_start": 1, - "orfs_end": 8007, + "orfs_end": 8006, "blast_n_conseqs": 0 }, "small-sequence-with-xs": { @@ -92,7 +92,7 @@ "blast_qseq_coverage": 0.0, "blast_sseq_orfs_coverage": 0.0, "orfs_start": 1, - "orfs_end": 8007, + "orfs_end": 8006, "blast_n_conseqs": 0 }, "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.WITH-BAD-SYMBOLS[REVERSE_COMPLEMENT]": { @@ -104,7 +104,7 @@ "blast_qseq_coverage": 0.0, "blast_sseq_orfs_coverage": 0.0, "orfs_start": 1, - "orfs_end": 8007, + "orfs_end": 8006, "blast_n_conseqs": 0 }, "small-sequence-with-bad-symbols": { @@ -116,7 +116,7 @@ "blast_qseq_coverage": 0.0, "blast_sseq_orfs_coverage": 0.0, "orfs_start": 1, - "orfs_end": 8007, + "orfs_end": 8006, "blast_n_conseqs": 0 }, "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.BUT.WITH-DASHES[REVERSE_COMPLEMENT]": { @@ -128,7 +128,7 @@ "blast_qseq_coverage": 0.0, "blast_sseq_orfs_coverage": 0.0, "orfs_start": 1, - "orfs_end": 8007, + "orfs_end": 8006, "blast_n_conseqs": 0 }, "small-sequence-with-dashes": { @@ -140,7 +140,7 @@ "blast_qseq_coverage": 0.0, "blast_sseq_orfs_coverage": 0.0, "orfs_start": 1, - "orfs_end": 8007, + "orfs_end": 8006, "blast_n_conseqs": 0 } } \ No newline at end of file diff --git a/tests/expected-results-edgy/orfs.json b/tests/expected-results-edgy/orfs.json index a68a56d..f1a76de 100644 --- a/tests/expected-results-edgy/orfs.json +++ b/tests/expected-results-edgy/orfs.json @@ -3,9 +3,9 @@ { "name": "gag", "start": 789, - "end": 2292, + "end": 2291, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.0, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALDKIEEEQNKSKKKAQQAAADTGHSNQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHTARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPPQKQEPIDKELYPLTSLRSLFGNDPSSQ", @@ -15,9 +15,9 @@ { "name": "pol", "start": 2084, - "end": 5096, + "end": 5095, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.0, "protein": "FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSPSEAGADRQGTVSFNFPQVTLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVTLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTGATVRAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRNPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -27,9 +27,9 @@ { "name": "vif", "start": 5040, - "end": 5619, + "end": 5618, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.0, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYESPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -39,9 +39,9 @@ { "name": "vpr", "start": 5558, - "end": 5849, + "end": 5848, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.0, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTRQRRARNGASRS", @@ -51,21 +51,21 @@ { "name": "tat_exon1", "start": 5829, - "end": 6048, + "end": 6044, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.0, "protein": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5968, - "end": 6049, + "end": 6048, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.17292490118577064, "protein": "MAGRSGDSDEELIRTVRLIKLLYQSSK", @@ -75,9 +75,9 @@ { "name": "vpu", "start": 6060, - "end": 6309, + "end": 6308, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.0, "protein": "MQPIPIVAIVALVVAIIIAIVVWSIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEISALVEMGVEMGHHAPWDVDDL", @@ -87,9 +87,9 @@ { "name": "env", "start": 6223, - "end": 8794, + "end": 8793, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.0, "protein": "MRVKEKYQHLWRWGWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLKNDTNTNSSSGRMIMEKGEIKNCSFNISTSIRGKVQKEYAFFYKLDIIPIDNDTTSYKLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSVNFTDNAKTIIVQLNTSVEINCTRPNNNTRKRIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNNTLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQIINMWQKVGKAMYAPPISGQIRCSSNITGLLLTRDGGNSNNESEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNHTTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPTPRGPDRPEGTEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGACRAIRHIPRRIRQGLERILL", @@ -99,9 +99,9 @@ { "name": "tat_exon2", "start": 8375, - "end": 8471, + "end": 8470, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.0, "protein": "RPTSQPRGDPTGPKEPKKKVERETETDPFD", @@ -111,9 +111,9 @@ { "name": "rev_exon2", "start": 8376, - "end": 8652, + "end": 8651, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.0, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIHSISERILGTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTVLESGTKE", @@ -123,9 +123,9 @@ { "name": "nef", "start": 8795, - "end": 9416, + "end": 9415, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.0, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADRVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCYKLVPVEPDKIEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", @@ -137,9 +137,9 @@ { "name": "gag", "start": 0, - "end": 21, + "end": 20, "subtype_start": 1, - "subtype_end": 1498, + "subtype_end": 1497, "orientation": "forward", "distance": 0.7803451759315906, "protein": "", @@ -149,9 +149,9 @@ { "name": "pol", "start": 0, - "end": 21, + "end": 20, "subtype_start": 1290, - "subtype_end": 4302, + "subtype_end": 4301, "orientation": "forward", "distance": 0.7794791415481068, "protein": "DSGSERX", @@ -161,9 +161,9 @@ { "name": "env", "start": 0, - "end": 21, + "end": 20, "subtype_start": 5430, - "subtype_end": 8007, + "subtype_end": 8006, "orientation": "forward", "distance": 0.7802599076361288, "protein": "", @@ -173,9 +173,9 @@ { "name": "vif", "start": 0, - "end": 21, + "end": 20, "subtype_start": 4246, - "subtype_end": 4822, + "subtype_end": 4821, "orientation": "forward", "distance": 0.7806712105497112, "protein": "", @@ -185,9 +185,9 @@ { "name": "vpr", "start": 0, - "end": 21, + "end": 20, "subtype_start": 4764, - "subtype_end": 5052, + "subtype_end": 5051, "orientation": "forward", "distance": 0.7812035661218425, "protein": "", @@ -197,9 +197,9 @@ { "name": "tat_exon1", "start": 0, - "end": 6, + "end": 5, "subtype_start": 5032, - "subtype_end": 5248, + "subtype_end": 5247, "orientation": "forward", "distance": 0.7815405696388372, "protein": "", @@ -209,9 +209,9 @@ { "name": "rev_exon1", "start": 0, - "end": 6, + "end": 5, "subtype_start": 5171, - "subtype_end": 5249, + "subtype_end": 5248, "orientation": "forward", "distance": 0.7839721254355401, "protein": "", @@ -221,9 +221,9 @@ { "name": "vpu", "start": 0, - "end": 21, + "end": 20, "subtype_start": 5267, - "subtype_end": 5513, + "subtype_end": 5512, "orientation": "forward", "distance": 0.7813860351732544, "protein": "", @@ -233,9 +233,9 @@ { "name": "nef", "start": 0, - "end": 21, + "end": 20, "subtype_start": 8008, - "subtype_end": 8683, + "subtype_end": 8682, "orientation": "forward", "distance": 0.7805933836772095, "protein": "", @@ -245,9 +245,9 @@ { "name": "tat_exon2", "start": 19, - "end": 19, + "end": 18, "subtype_start": 7567, - "subtype_end": 7663, + "subtype_end": 7662, "orientation": "forward", "distance": 0.7834691501746216, "protein": "", @@ -257,9 +257,9 @@ { "name": "rev_exon2", "start": 19, - "end": 19, + "end": 18, "subtype_start": 7568, - "subtype_end": 7865, + "subtype_end": 7864, "orientation": "forward", "distance": 0.7811712165958367, "protein": "", @@ -271,9 +271,9 @@ { "name": "gag", "start": 0, - "end": 3, + "end": 2, "subtype_start": 1, - "subtype_end": 1498, + "subtype_end": 1497, "orientation": "forward", "distance": 0.7803451759315906, "protein": "", @@ -283,9 +283,9 @@ { "name": "pol", "start": 0, - "end": 3, + "end": 2, "subtype_start": 1290, - "subtype_end": 4302, + "subtype_end": 4301, "orientation": "forward", "distance": 0.7801729318524067, "protein": "X", @@ -295,9 +295,9 @@ { "name": "env", "start": 0, - "end": 3, + "end": 2, "subtype_start": 5430, - "subtype_end": 8007, + "subtype_end": 8006, "orientation": "forward", "distance": 0.7802599076361288, "protein": "", @@ -307,9 +307,9 @@ { "name": "vif", "start": 0, - "end": 3, + "end": 2, "subtype_start": 4246, - "subtype_end": 4822, + "subtype_end": 4821, "orientation": "forward", "distance": 0.7806712105497112, "protein": "", @@ -319,9 +319,9 @@ { "name": "vpr", "start": 0, - "end": 3, + "end": 2, "subtype_start": 4764, - "subtype_end": 5052, + "subtype_end": 5051, "orientation": "forward", "distance": 0.7812035661218425, "protein": "", @@ -331,9 +331,9 @@ { "name": "tat_exon1", "start": 0, - "end": 3, + "end": 2, "subtype_start": 5032, - "subtype_end": 5248, + "subtype_end": 5247, "orientation": "forward", "distance": 0.7815405696388372, "protein": "", @@ -343,9 +343,9 @@ { "name": "rev_exon1", "start": 0, - "end": 3, + "end": 2, "subtype_start": 5171, - "subtype_end": 5249, + "subtype_end": 5248, "orientation": "forward", "distance": 0.7839721254355401, "protein": "", @@ -355,9 +355,9 @@ { "name": "vpu", "start": 0, - "end": 3, + "end": 2, "subtype_start": 5267, - "subtype_end": 5513, + "subtype_end": 5512, "orientation": "forward", "distance": 0.7813860351732544, "protein": "", @@ -367,9 +367,9 @@ { "name": "nef", "start": 0, - "end": 3, + "end": 2, "subtype_start": 8008, - "subtype_end": 8683, + "subtype_end": 8682, "orientation": "forward", "distance": 0.7805933836772095, "protein": "", @@ -379,9 +379,9 @@ { "name": "tat_exon2", "start": 1, - "end": 1, + "end": 0, "subtype_start": 7567, - "subtype_end": 7663, + "subtype_end": 7662, "orientation": "forward", "distance": 0.7834691501746216, "protein": "", @@ -391,9 +391,9 @@ { "name": "rev_exon2", "start": 1, - "end": 1, + "end": 0, "subtype_start": 7568, - "subtype_end": 7865, + "subtype_end": 7864, "orientation": "forward", "distance": 0.7811712165958367, "protein": "", @@ -405,9 +405,9 @@ { "name": "gag", "start": 0, - "end": 0, + "end": -1, "subtype_start": 1, - "subtype_end": 1498, + "subtype_end": 1497, "orientation": "forward", "distance": 0.7803451759315906, "protein": "", @@ -417,9 +417,9 @@ { "name": "pol", "start": 0, - "end": 0, + "end": -1, "subtype_start": 1290, - "subtype_end": 4302, + "subtype_end": 4301, "orientation": "forward", "distance": 0.78024284744996, "protein": "", @@ -429,9 +429,9 @@ { "name": "env", "start": 0, - "end": 0, + "end": -1, "subtype_start": 5430, - "subtype_end": 8007, + "subtype_end": 8006, "orientation": "forward", "distance": 0.7802599076361288, "protein": "", @@ -441,9 +441,9 @@ { "name": "vif", "start": 0, - "end": 0, + "end": -1, "subtype_start": 4246, - "subtype_end": 4822, + "subtype_end": 4821, "orientation": "forward", "distance": 0.7806712105497112, "protein": "", @@ -453,9 +453,9 @@ { "name": "vpr", "start": 0, - "end": 0, + "end": -1, "subtype_start": 4764, - "subtype_end": 5052, + "subtype_end": 5051, "orientation": "forward", "distance": 0.7812035661218425, "protein": "", @@ -465,9 +465,9 @@ { "name": "tat_exon1", "start": 0, - "end": 3, + "end": 2, "subtype_start": 5032, - "subtype_end": 5248, + "subtype_end": 5247, "orientation": "forward", "distance": 0.7815405696388372, "protein": "", @@ -477,9 +477,9 @@ { "name": "rev_exon1", "start": 0, - "end": 3, + "end": 2, "subtype_start": 5171, - "subtype_end": 5249, + "subtype_end": 5248, "orientation": "forward", "distance": 0.7839721254355401, "protein": "", @@ -489,9 +489,9 @@ { "name": "vpu", "start": 0, - "end": 0, + "end": -1, "subtype_start": 5267, - "subtype_end": 5513, + "subtype_end": 5512, "orientation": "forward", "distance": 0.7813860351732544, "protein": "", @@ -501,9 +501,9 @@ { "name": "tat_exon2", "start": 0, - "end": 0, + "end": -1, "subtype_start": 7567, - "subtype_end": 7663, + "subtype_end": 7662, "orientation": "forward", "distance": 0.7834691501746216, "protein": "", @@ -513,9 +513,9 @@ { "name": "rev_exon2", "start": 0, - "end": 0, + "end": -1, "subtype_start": 7568, - "subtype_end": 7865, + "subtype_end": 7864, "orientation": "forward", "distance": 0.7811712165958367, "protein": "", @@ -525,9 +525,9 @@ { "name": "nef", "start": 0, - "end": 0, + "end": -1, "subtype_start": 8008, - "subtype_end": 8683, + "subtype_end": 8682, "orientation": "forward", "distance": 0.7805933836772095, "protein": "", @@ -539,9 +539,9 @@ { "name": "gag", "start": 0, - "end": 0, + "end": -1, "subtype_start": 1, - "subtype_end": 1498, + "subtype_end": 1497, "orientation": "forward", "distance": 0.7803451759315906, "protein": "", @@ -551,9 +551,9 @@ { "name": "pol", "start": 0, - "end": 0, + "end": -1, "subtype_start": 1290, - "subtype_end": 4302, + "subtype_end": 4301, "orientation": "forward", "distance": 0.78024284744996, "protein": "", @@ -563,9 +563,9 @@ { "name": "env", "start": 0, - "end": 0, + "end": -1, "subtype_start": 5430, - "subtype_end": 8007, + "subtype_end": 8006, "orientation": "forward", "distance": 0.7802599076361288, "protein": "", @@ -575,9 +575,9 @@ { "name": "vif", "start": 0, - "end": 0, + "end": -1, "subtype_start": 4246, - "subtype_end": 4822, + "subtype_end": 4821, "orientation": "forward", "distance": 0.7806712105497112, "protein": "", @@ -587,9 +587,9 @@ { "name": "vpr", "start": 0, - "end": 0, + "end": -1, "subtype_start": 4764, - "subtype_end": 5052, + "subtype_end": 5051, "orientation": "forward", "distance": 0.7812035661218425, "protein": "", @@ -599,9 +599,9 @@ { "name": "tat_exon1", "start": 0, - "end": 3, + "end": 2, "subtype_start": 5032, - "subtype_end": 5248, + "subtype_end": 5247, "orientation": "forward", "distance": 0.7815405696388372, "protein": "", @@ -611,9 +611,9 @@ { "name": "rev_exon1", "start": 0, - "end": 3, + "end": 2, "subtype_start": 5171, - "subtype_end": 5249, + "subtype_end": 5248, "orientation": "forward", "distance": 0.7839721254355401, "protein": "", @@ -623,9 +623,9 @@ { "name": "vpu", "start": 0, - "end": 0, + "end": -1, "subtype_start": 5267, - "subtype_end": 5513, + "subtype_end": 5512, "orientation": "forward", "distance": 0.7813860351732544, "protein": "", @@ -635,9 +635,9 @@ { "name": "tat_exon2", "start": 0, - "end": 0, + "end": -1, "subtype_start": 7567, - "subtype_end": 7663, + "subtype_end": 7662, "orientation": "forward", "distance": 0.7834691501746216, "protein": "", @@ -647,9 +647,9 @@ { "name": "rev_exon2", "start": 0, - "end": 0, + "end": -1, "subtype_start": 7568, - "subtype_end": 7865, + "subtype_end": 7864, "orientation": "forward", "distance": 0.7811712165958367, "protein": "", @@ -659,9 +659,9 @@ { "name": "nef", "start": 0, - "end": 0, + "end": -1, "subtype_start": 8008, - "subtype_end": 8683, + "subtype_end": 8682, "orientation": "forward", "distance": 0.7805933836772095, "protein": "", @@ -673,9 +673,9 @@ { "name": "gag", "start": 789, - "end": 2292, + "end": 2291, "subtype_start": 1, - "subtype_end": 1498, + "subtype_end": 1497, "orientation": "forward", "distance": 0.440500017556797, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALDKIEEEQNKSKKKAQQAAADTGHSNQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHTARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPPQKQEPIDKELYPLTSLRSLFGNDPSSQ", @@ -685,9 +685,9 @@ { "name": "pol", "start": 2084, - "end": 5096, + "end": 5095, "subtype_start": 1290, - "subtype_end": 4302, + "subtype_end": 4301, "orientation": "forward", "distance": 0.3413274429367835, "protein": "FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSPSEAGADRQGTVSFNFPQVTLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVTLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTGATVRAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRNPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -697,9 +697,9 @@ { "name": "vif", "start": 5040, - "end": 5619, + "end": 5618, "subtype_start": 4246, - "subtype_end": 4822, + "subtype_end": 4821, "orientation": "forward", "distance": 0.5405000748615061, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYESPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -709,9 +709,9 @@ { "name": "vpr", "start": 5558, - "end": 5849, + "end": 5848, "subtype_start": 4764, - "subtype_end": 5052, + "subtype_end": 5051, "orientation": "forward", "distance": 0.4799377378069871, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTRQRRARNGASRS", @@ -721,21 +721,21 @@ { "name": "tat_exon1", "start": 5829, - "end": 6048, + "end": 6044, "subtype_start": 5032, - "subtype_end": 5248, + "subtype_end": 5247, "orientation": "forward", "distance": 0.6071805702217529, "protein": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5968, - "end": 6049, + "end": 6048, "subtype_start": 5171, - "subtype_end": 5249, + "subtype_end": 5248, "orientation": "forward", "distance": 0.564475664826894, "protein": "MAGRSGDSDEELIRTVRLIKLLYQSSK", @@ -745,9 +745,9 @@ { "name": "vpu", "start": 6060, - "end": 6309, + "end": 6308, "subtype_start": 5267, - "subtype_end": 5513, + "subtype_end": 5512, "orientation": "forward", "distance": 0.6459390862944163, "protein": "MQPIPIVAIVALVVAIIIAIVVWSIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEISALVEMGVEMGHHAPWDVDDL", @@ -757,9 +757,9 @@ { "name": "env", "start": 6223, - "end": 8794, + "end": 8793, "subtype_start": 5430, - "subtype_end": 8007, + "subtype_end": 8006, "orientation": "forward", "distance": 0.5813365460413784, "protein": "MRVKEKYQHLWRWGWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLKNDTNTNSSSGRMIMEKGEIKNCSFNISTSIRGKVQKEYAFFYKLDIIPIDNDTTSYKLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSVNFTDNAKTIIVQLNTSVEINCTRPNNNTRKRIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNNTLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQIINMWQKVGKAMYAPPISGQIRCSSNITGLLLTRDGGNSNNESEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNHTTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPTPRGPDRPEGTEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGACRAIRHIPRRIRQGLERILL", @@ -769,9 +769,9 @@ { "name": "tat_exon2", "start": 8375, - "end": 8471, + "end": 8470, "subtype_start": 7567, - "subtype_end": 7663, + "subtype_end": 7662, "orientation": "forward", "distance": 0.6760287393860223, "protein": "RPTSQPRGDPTGPKEPKKKVERETETDPFD", @@ -781,9 +781,9 @@ { "name": "rev_exon2", "start": 8376, - "end": 8652, + "end": 8651, "subtype_start": 7568, - "subtype_end": 7865, + "subtype_end": 7864, "orientation": "forward", "distance": 0.5593461265103057, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIHSISERILGTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTVLESGTKE", @@ -793,9 +793,9 @@ { "name": "nef", "start": 8795, - "end": 9416, + "end": 9415, "subtype_start": 8008, - "subtype_end": 8683, + "subtype_end": 8682, "orientation": "forward", "distance": 0.617079300572162, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADRVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCYKLVPVEPDKIEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", @@ -807,9 +807,9 @@ { "name": "gag", "start": 789, - "end": 2292, + "end": 2291, "subtype_start": 1, - "subtype_end": 1498, + "subtype_end": 1497, "orientation": "forward", "distance": 0.440500017556797, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALDKIEEEQNKSKKKAQQAAADTGHSNQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHTARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPPQKQEPIDKELYPLTSLRSLFGNDPSSQ", @@ -819,9 +819,9 @@ { "name": "pol", "start": 2084, - "end": 5096, + "end": 5095, "subtype_start": 1290, - "subtype_end": 4302, + "subtype_end": 4301, "orientation": "forward", "distance": 0.3413274429367835, "protein": "FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSPSEAGADRQGTVSFNFPQVTLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVTLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTGATVRAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRNPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -831,9 +831,9 @@ { "name": "vif", "start": 5040, - "end": 5619, + "end": 5618, "subtype_start": 4246, - "subtype_end": 4822, + "subtype_end": 4821, "orientation": "forward", "distance": 0.5405000748615061, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYESPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -843,9 +843,9 @@ { "name": "vpr", "start": 5558, - "end": 5849, + "end": 5848, "subtype_start": 4764, - "subtype_end": 5052, + "subtype_end": 5051, "orientation": "forward", "distance": 0.4799377378069871, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTRQRRARNGASRS", @@ -855,21 +855,21 @@ { "name": "tat_exon1", "start": 5829, - "end": 6048, + "end": 6044, "subtype_start": 5032, - "subtype_end": 5248, + "subtype_end": 5247, "orientation": "forward", "distance": 0.6071805702217529, "protein": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5968, - "end": 6049, + "end": 6048, "subtype_start": 5171, - "subtype_end": 5249, + "subtype_end": 5248, "orientation": "forward", "distance": 0.564475664826894, "protein": "MAGRSGDSDEELIRTVRLIKLLYQSSK", @@ -879,9 +879,9 @@ { "name": "vpu", "start": 6060, - "end": 6309, + "end": 6308, "subtype_start": 5267, - "subtype_end": 5513, + "subtype_end": 5512, "orientation": "forward", "distance": 0.6459390862944163, "protein": "MQPIPIVAIVALVVAIIIAIVVWSIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEISALVEMGVEMGHHAPWDVDDL", @@ -891,9 +891,9 @@ { "name": "env", "start": 6223, - "end": 8794, + "end": 8793, "subtype_start": 5430, - "subtype_end": 8007, + "subtype_end": 8006, "orientation": "forward", "distance": 0.5813365460413784, "protein": "MRVKEKYQHLWRWGWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLKNDTNTNSSSGRMIMEKGEIKNCSFNISTSIRGKVQKEYAFFYKLDIIPIDNDTTSYKLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSVNFTDNAKTIIVQLNTSVEINCTRPNNNTRKRIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNNTLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQIINMWQKVGKAMYAPPISGQIRCSSNITGLLLTRDGGNSNNESEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNHTTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPTPRGPDRPEGTEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGACRAIRHIPRRIRQGLERILL", @@ -903,9 +903,9 @@ { "name": "tat_exon2", "start": 8375, - "end": 8471, + "end": 8470, "subtype_start": 7567, - "subtype_end": 7663, + "subtype_end": 7662, "orientation": "forward", "distance": 0.6760287393860223, "protein": "RPTSQPRGDPTGPKEPKKKVERETETDPFD", @@ -915,9 +915,9 @@ { "name": "rev_exon2", "start": 8376, - "end": 8652, + "end": 8651, "subtype_start": 7568, - "subtype_end": 7865, + "subtype_end": 7864, "orientation": "forward", "distance": 0.5593461265103057, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIHSISERILGTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTVLESGTKE", @@ -927,9 +927,9 @@ { "name": "nef", "start": 8795, - "end": 9416, + "end": 9415, "subtype_start": 8008, - "subtype_end": 8683, + "subtype_end": 8682, "orientation": "forward", "distance": 0.617079300572162, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADRVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCYKLVPVEPDKIEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", @@ -941,9 +941,9 @@ { "name": "gag", "start": 0, - "end": 12, + "end": 11, "subtype_start": 1, - "subtype_end": 1498, + "subtype_end": 1497, "orientation": "forward", "distance": 0.7803451759315906, "protein": "", @@ -953,9 +953,9 @@ { "name": "pol", "start": 0, - "end": 12, + "end": 11, "subtype_start": 1290, - "subtype_end": 4302, + "subtype_end": 4301, "orientation": "forward", "distance": 0.7797603025967217, "protein": "ISRV", @@ -965,9 +965,9 @@ { "name": "env", "start": 0, - "end": 12, + "end": 11, "subtype_start": 5430, - "subtype_end": 8007, + "subtype_end": 8006, "orientation": "forward", "distance": 0.7802599076361288, "protein": "", @@ -977,9 +977,9 @@ { "name": "vif", "start": 0, - "end": 12, + "end": 11, "subtype_start": 4246, - "subtype_end": 4822, + "subtype_end": 4821, "orientation": "forward", "distance": 0.7806712105497112, "protein": "", @@ -989,9 +989,9 @@ { "name": "vpr", "start": 0, - "end": 12, + "end": 11, "subtype_start": 4764, - "subtype_end": 5052, + "subtype_end": 5051, "orientation": "forward", "distance": 0.7812035661218425, "protein": "", @@ -1001,9 +1001,9 @@ { "name": "tat_exon1", "start": 0, - "end": 15, + "end": 14, "subtype_start": 5032, - "subtype_end": 5248, + "subtype_end": 5247, "orientation": "forward", "distance": 0.7815405696388372, "protein": "", @@ -1013,9 +1013,9 @@ { "name": "rev_exon1", "start": 0, - "end": 15, + "end": 14, "subtype_start": 5171, - "subtype_end": 5249, + "subtype_end": 5248, "orientation": "forward", "distance": 0.7839721254355401, "protein": "", @@ -1025,9 +1025,9 @@ { "name": "vpu", "start": 0, - "end": 12, + "end": 11, "subtype_start": 5267, - "subtype_end": 5513, + "subtype_end": 5512, "orientation": "forward", "distance": 0.7813860351732544, "protein": "", @@ -1037,9 +1037,9 @@ { "name": "nef", "start": 0, - "end": 12, + "end": 11, "subtype_start": 8008, - "subtype_end": 8683, + "subtype_end": 8682, "orientation": "forward", "distance": 0.7805933836772095, "protein": "", @@ -1049,9 +1049,9 @@ { "name": "tat_exon2", "start": 12, - "end": 12, + "end": 11, "subtype_start": 7567, - "subtype_end": 7663, + "subtype_end": 7662, "orientation": "forward", "distance": 0.7834691501746216, "protein": "", @@ -1061,9 +1061,9 @@ { "name": "rev_exon2", "start": 12, - "end": 12, + "end": 11, "subtype_start": 7568, - "subtype_end": 7865, + "subtype_end": 7864, "orientation": "forward", "distance": 0.7811712165958367, "protein": "", @@ -1075,9 +1075,9 @@ { "name": "gag", "start": 789, - "end": 2292, + "end": 2291, "subtype_start": 1, - "subtype_end": 1498, + "subtype_end": 1497, "orientation": "forward", "distance": 0.440500017556797, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALDKIEEEQNKSKKKAQQAAADTGHSNQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHTARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPPQKQEPIDKELYPLTSLRSLFGNDPSSQ", @@ -1087,9 +1087,9 @@ { "name": "pol", "start": 2084, - "end": 5096, + "end": 5095, "subtype_start": 1290, - "subtype_end": 4302, + "subtype_end": 4301, "orientation": "forward", "distance": 0.3413274429367835, "protein": "FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSPSEAGADRQGTVSFNFPQVTLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVTLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTGATVRAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRNPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -1099,9 +1099,9 @@ { "name": "vif", "start": 5040, - "end": 5619, + "end": 5618, "subtype_start": 4246, - "subtype_end": 4822, + "subtype_end": 4821, "orientation": "forward", "distance": 0.5405000748615061, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYESPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -1111,9 +1111,9 @@ { "name": "vpr", "start": 5558, - "end": 5849, + "end": 5848, "subtype_start": 4764, - "subtype_end": 5052, + "subtype_end": 5051, "orientation": "forward", "distance": 0.4799377378069871, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTRQRRARNGASRS", @@ -1123,21 +1123,21 @@ { "name": "tat_exon1", "start": 5829, - "end": 6048, + "end": 6044, "subtype_start": 5032, - "subtype_end": 5248, + "subtype_end": 5247, "orientation": "forward", "distance": 0.6071805702217529, "protein": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5968, - "end": 6049, + "end": 6048, "subtype_start": 5171, - "subtype_end": 5249, + "subtype_end": 5248, "orientation": "forward", "distance": 0.564475664826894, "protein": "MAGRSGDSDEELIRTVRLIKLLYQSSK", @@ -1147,9 +1147,9 @@ { "name": "vpu", "start": 6060, - "end": 6309, + "end": 6308, "subtype_start": 5267, - "subtype_end": 5513, + "subtype_end": 5512, "orientation": "forward", "distance": 0.6459390862944163, "protein": "MQPIPIVAIVALVVAIIIAIVVWSIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEISALVEMGVEMGHHAPWDVDDL", @@ -1159,9 +1159,9 @@ { "name": "env", "start": 6223, - "end": 8794, + "end": 8793, "subtype_start": 5430, - "subtype_end": 8007, + "subtype_end": 8006, "orientation": "forward", "distance": 0.5813365460413784, "protein": "MRVKEKYQHLWRWGWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLKNDTNTNSSSGRMIMEKGEIKNCSFNISTSIRGKVQKEYAFFYKLDIIPIDNDTTSYKLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSVNFTDNAKTIIVQLNTSVEINCTRPNNNTRKRIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNNTLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQIINMWQKVGKAMYAPPISGQIRCSSNITGLLLTRDGGNSNNESEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNHTTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPTPRGPDRPEGTEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGACRAIRHIPRRIRQGLERILL", @@ -1171,9 +1171,9 @@ { "name": "tat_exon2", "start": 8375, - "end": 8471, + "end": 8470, "subtype_start": 7567, - "subtype_end": 7663, + "subtype_end": 7662, "orientation": "forward", "distance": 0.6760287393860223, "protein": "RPTSQPRGDPTGPKEPKKKVERETETDPFD", @@ -1183,9 +1183,9 @@ { "name": "rev_exon2", "start": 8376, - "end": 8652, + "end": 8651, "subtype_start": 7568, - "subtype_end": 7865, + "subtype_end": 7864, "orientation": "forward", "distance": 0.5593461265103057, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIHSISERILGTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTVLESGTKE", @@ -1195,9 +1195,9 @@ { "name": "nef", "start": 8795, - "end": 9416, + "end": 9415, "subtype_start": 8008, - "subtype_end": 8683, + "subtype_end": 8682, "orientation": "forward", "distance": 0.617079300572162, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADRVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCYKLVPVEPDKIEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", @@ -1209,9 +1209,9 @@ { "name": "gag", "start": 0, - "end": 12, + "end": 11, "subtype_start": 1, - "subtype_end": 1498, + "subtype_end": 1497, "orientation": "forward", "distance": 0.7803451759315906, "protein": "", @@ -1221,9 +1221,9 @@ { "name": "pol", "start": 0, - "end": 12, + "end": 11, "subtype_start": 1290, - "subtype_end": 4302, + "subtype_end": 4301, "orientation": "forward", "distance": 0.7797603025967217, "protein": "ISRV", @@ -1233,9 +1233,9 @@ { "name": "env", "start": 0, - "end": 12, + "end": 11, "subtype_start": 5430, - "subtype_end": 8007, + "subtype_end": 8006, "orientation": "forward", "distance": 0.7802599076361288, "protein": "", @@ -1245,9 +1245,9 @@ { "name": "vif", "start": 0, - "end": 12, + "end": 11, "subtype_start": 4246, - "subtype_end": 4822, + "subtype_end": 4821, "orientation": "forward", "distance": 0.7806712105497112, "protein": "", @@ -1257,9 +1257,9 @@ { "name": "vpr", "start": 0, - "end": 12, + "end": 11, "subtype_start": 4764, - "subtype_end": 5052, + "subtype_end": 5051, "orientation": "forward", "distance": 0.7812035661218425, "protein": "", @@ -1269,9 +1269,9 @@ { "name": "tat_exon1", "start": 0, - "end": 15, + "end": 14, "subtype_start": 5032, - "subtype_end": 5248, + "subtype_end": 5247, "orientation": "forward", "distance": 0.7815405696388372, "protein": "", @@ -1281,9 +1281,9 @@ { "name": "rev_exon1", "start": 0, - "end": 15, + "end": 14, "subtype_start": 5171, - "subtype_end": 5249, + "subtype_end": 5248, "orientation": "forward", "distance": 0.7839721254355401, "protein": "", @@ -1293,9 +1293,9 @@ { "name": "vpu", "start": 0, - "end": 12, + "end": 11, "subtype_start": 5267, - "subtype_end": 5513, + "subtype_end": 5512, "orientation": "forward", "distance": 0.7813860351732544, "protein": "", @@ -1305,9 +1305,9 @@ { "name": "nef", "start": 0, - "end": 12, + "end": 11, "subtype_start": 8008, - "subtype_end": 8683, + "subtype_end": 8682, "orientation": "forward", "distance": 0.7805933836772095, "protein": "", @@ -1317,9 +1317,9 @@ { "name": "tat_exon2", "start": 12, - "end": 12, + "end": 11, "subtype_start": 7567, - "subtype_end": 7663, + "subtype_end": 7662, "orientation": "forward", "distance": 0.7834691501746216, "protein": "", @@ -1329,9 +1329,9 @@ { "name": "rev_exon2", "start": 12, - "end": 12, + "end": 11, "subtype_start": 7568, - "subtype_end": 7865, + "subtype_end": 7864, "orientation": "forward", "distance": 0.7811712165958367, "protein": "", @@ -1343,9 +1343,9 @@ { "name": "gag", "start": 789, - "end": 2292, + "end": 2291, "subtype_start": 1, - "subtype_end": 1498, + "subtype_end": 1497, "orientation": "forward", "distance": 0.440500017556797, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALDKIEEEQNKSKKKAQQAAADTGHSNQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHTARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPPQKQEPIDKELYPLTSLRSLFGNDPSSQ", @@ -1355,9 +1355,9 @@ { "name": "pol", "start": 2084, - "end": 5096, + "end": 5095, "subtype_start": 1290, - "subtype_end": 4302, + "subtype_end": 4301, "orientation": "forward", "distance": 0.3413274429367835, "protein": "FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSPSEAGADRQGTVSFNFPQVTLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVTLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTGATVRAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRNPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -1367,9 +1367,9 @@ { "name": "vif", "start": 5040, - "end": 5619, + "end": 5618, "subtype_start": 4246, - "subtype_end": 4822, + "subtype_end": 4821, "orientation": "forward", "distance": 0.5405000748615061, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYESPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -1379,9 +1379,9 @@ { "name": "vpr", "start": 5558, - "end": 5849, + "end": 5848, "subtype_start": 4764, - "subtype_end": 5052, + "subtype_end": 5051, "orientation": "forward", "distance": 0.4799377378069871, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTRQRRARNGASRS", @@ -1391,21 +1391,21 @@ { "name": "tat_exon1", "start": 5829, - "end": 6048, + "end": 6044, "subtype_start": 5032, - "subtype_end": 5248, + "subtype_end": 5247, "orientation": "forward", "distance": 0.6071805702217529, "protein": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFITKALGISYGRKKRRQRRRAHQNSQTHQASLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAGAACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5968, - "end": 6049, + "end": 6048, "subtype_start": 5171, - "subtype_end": 5249, + "subtype_end": 5248, "orientation": "forward", "distance": 0.564475664826894, "protein": "MAGRSGDSDEELIRTVRLIKLLYQSSK", @@ -1415,9 +1415,9 @@ { "name": "vpu", "start": 6060, - "end": 6309, + "end": 6308, "subtype_start": 5267, - "subtype_end": 5513, + "subtype_end": 5512, "orientation": "forward", "distance": 0.6459390862944163, "protein": "MQPIPIVAIVALVVAIIIAIVVWSIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEISALVEMGVEMGHHAPWDVDDL", @@ -1427,9 +1427,9 @@ { "name": "env", "start": 6223, - "end": 8794, + "end": 8793, "subtype_start": 5430, - "subtype_end": 8007, + "subtype_end": 8006, "orientation": "forward", "distance": 0.5813365460413784, "protein": "MRVKEKYQHLWRWGWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLKNDTNTNSSSGRMIMEKGEIKNCSFNISTSIRGKVQKEYAFFYKLDIIPIDNDTTSYKLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSVNFTDNAKTIIVQLNTSVEINCTRPNNNTRKRIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNNTLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQIINMWQKVGKAMYAPPISGQIRCSSNITGLLLTRDGGNSNNESEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNHTTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPTPRGPDRPEGTEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGACRAIRHIPRRIRQGLERILL", @@ -1439,9 +1439,9 @@ { "name": "tat_exon2", "start": 8375, - "end": 8471, + "end": 8470, "subtype_start": 7567, - "subtype_end": 7663, + "subtype_end": 7662, "orientation": "forward", "distance": 0.6760287393860223, "protein": "RPTSQPRGDPTGPKEPKKKVERETETDPFD", @@ -1451,9 +1451,9 @@ { "name": "rev_exon2", "start": 8376, - "end": 8652, + "end": 8651, "subtype_start": 7568, - "subtype_end": 7865, + "subtype_end": 7864, "orientation": "forward", "distance": 0.5593461265103057, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIHSISERILGTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTVLESGTKE", @@ -1463,9 +1463,9 @@ { "name": "nef", "start": 8795, - "end": 9416, + "end": 9415, "subtype_start": 8008, - "subtype_end": 8683, + "subtype_end": 8682, "orientation": "forward", "distance": 0.617079300572162, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADRVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCYKLVPVEPDKIEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", @@ -1477,9 +1477,9 @@ { "name": "gag", "start": 0, - "end": 12, + "end": 11, "subtype_start": 1, - "subtype_end": 1498, + "subtype_end": 1497, "orientation": "forward", "distance": 0.7803451759315906, "protein": "", @@ -1489,9 +1489,9 @@ { "name": "pol", "start": 0, - "end": 12, + "end": 11, "subtype_start": 1290, - "subtype_end": 4302, + "subtype_end": 4301, "orientation": "forward", "distance": 0.7797603025967217, "protein": "ISRV", @@ -1501,9 +1501,9 @@ { "name": "env", "start": 0, - "end": 12, + "end": 11, "subtype_start": 5430, - "subtype_end": 8007, + "subtype_end": 8006, "orientation": "forward", "distance": 0.7802599076361288, "protein": "", @@ -1513,9 +1513,9 @@ { "name": "vif", "start": 0, - "end": 12, + "end": 11, "subtype_start": 4246, - "subtype_end": 4822, + "subtype_end": 4821, "orientation": "forward", "distance": 0.7806712105497112, "protein": "", @@ -1525,9 +1525,9 @@ { "name": "vpr", "start": 0, - "end": 12, + "end": 11, "subtype_start": 4764, - "subtype_end": 5052, + "subtype_end": 5051, "orientation": "forward", "distance": 0.7812035661218425, "protein": "", @@ -1537,9 +1537,9 @@ { "name": "tat_exon1", "start": 0, - "end": 15, + "end": 14, "subtype_start": 5032, - "subtype_end": 5248, + "subtype_end": 5247, "orientation": "forward", "distance": 0.7815405696388372, "protein": "", @@ -1549,9 +1549,9 @@ { "name": "rev_exon1", "start": 0, - "end": 15, + "end": 14, "subtype_start": 5171, - "subtype_end": 5249, + "subtype_end": 5248, "orientation": "forward", "distance": 0.7839721254355401, "protein": "", @@ -1561,9 +1561,9 @@ { "name": "vpu", "start": 0, - "end": 12, + "end": 11, "subtype_start": 5267, - "subtype_end": 5513, + "subtype_end": 5512, "orientation": "forward", "distance": 0.7813860351732544, "protein": "", @@ -1573,9 +1573,9 @@ { "name": "nef", "start": 0, - "end": 12, + "end": 11, "subtype_start": 8008, - "subtype_end": 8683, + "subtype_end": 8682, "orientation": "forward", "distance": 0.7805933836772095, "protein": "", @@ -1585,9 +1585,9 @@ { "name": "tat_exon2", "start": 12, - "end": 12, + "end": 11, "subtype_start": 7567, - "subtype_end": 7663, + "subtype_end": 7662, "orientation": "forward", "distance": 0.7834691501746216, "protein": "", @@ -1597,9 +1597,9 @@ { "name": "rev_exon2", "start": 12, - "end": 12, + "end": 11, "subtype_start": 7568, - "subtype_end": 7865, + "subtype_end": 7864, "orientation": "forward", "distance": 0.7811712165958367, "protein": "", diff --git a/tests/expected-results-large-csv/errors.csv b/tests/expected-results-large-csv/errors.csv index 4177f70..5e7f1ac 100644 --- a/tests/expected-results-large-csv/errors.csv +++ b/tests/expected-results-large-csv/errors.csv @@ -1,37 +1,37 @@ sequence_name,error,message -KX505501.1,DeletionInOrf,"ORF pol at 2084-5096 can have maximum deletions 30, got 2721" -KX505501.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6322 -KX505501.1,InsertionInOrf,"Smaller ORF vif at 5040-5619 can have maximum insertions 90, got 909" -KX505501.1,DeletionInOrf,"Smaller ORF vpr at 5558-5849 can have maximum deletions 30, got 66" -KX505501.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892 -KX505501.1,InternalStopInOrf,Smaller ORF rev_exon1 at 5968-6046 contains an internal stop codon at 6004 -KX505501.1,FrameshiftInOrf,Smaller ORF vpu at 6060-6309 contains out of frame indels that impact 189 positions. -KX505501.1,FrameshiftInOrf,Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 51 positions. -KX505501.1,DeletionInOrf,"Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 96" -KX505501.1,InsertionInOrf,"Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 867" +KX505501.1,DeletionInOrf,"ORF pol at 2084-5095 can have maximum deletions 30, got 2721" +KX505501.1,InternalStopInOrf,ORF env at 6223-8793 contains an internal stop codon at 6322 +KX505501.1,InsertionInOrf,"Smaller ORF vif at 5040-5618 can have maximum insertions 90, got 909" +KX505501.1,DeletionInOrf,"Smaller ORF vpr at 5558-5848 can have maximum deletions 30, got 66" +KX505501.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5892 +KX505501.1,InternalStopInOrf,Smaller ORF rev_exon1 at 5968-6045 contains an internal stop codon at 6004 +KX505501.1,FrameshiftInOrf,Smaller ORF vpu at 6060-6308 contains out of frame indels that impact 190 positions. +KX505501.1,FrameshiftInOrf,Smaller ORF tat_exon2 at 8375-8470 contains out of frame indels that impact 51 positions. +KX505501.1,DeletionInOrf,"Smaller ORF rev_exon2 at 8376-8651 can have maximum deletions 30, got 96" +KX505501.1,InsertionInOrf,"Smaller ORF nef at 8795-9415 can have maximum insertions 90, got 867" KX505501.1,RevResponseElementDeletion,Query Sequence exceeds maximum deletion tolerance in RRE. Contains 265 deletions with max tolerance of 20 deletions. KX505501.1,LongDeletion,Query sequence contains a long deletion. KX505501.1,Scramble,Sequence is plus-scrambled. -MN691959,InternalStopInOrf,Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6123 -MN691959,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 -MN692074,DeletionInOrf,"ORF pol at 2084-5096 can have maximum deletions 30, got 981" -MN692074,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6550 -MN692074,DeletionInOrf,"Smaller ORF vif at 5040-5619 can have maximum deletions 30, got 81" -MN692074,InsertionInOrf,"Smaller ORF vpr at 5558-5849 can have maximum insertions 90, got 207" -MN692074,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892 -MN692074,InsertionInOrf,"Smaller ORF vpu at 6060-6309 can have maximum insertions 90, got 249" -MN692074,FrameshiftInOrf,Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 40 positions. -MN692074,DeletionInOrf,"Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 204" -MN692074,InsertionInOrf,"Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 882" +MN691959,InternalStopInOrf,Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6123 +MN691959,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420 +MN692074,DeletionInOrf,"ORF pol at 2084-5095 can have maximum deletions 30, got 981" +MN692074,InternalStopInOrf,ORF env at 6223-8793 contains an internal stop codon at 6550 +MN692074,DeletionInOrf,"Smaller ORF vif at 5040-5618 can have maximum deletions 30, got 81" +MN692074,InsertionInOrf,"Smaller ORF vpr at 5558-5848 can have maximum insertions 90, got 207" +MN692074,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5892 +MN692074,InsertionInOrf,"Smaller ORF vpu at 6060-6308 can have maximum insertions 90, got 249" +MN692074,FrameshiftInOrf,Smaller ORF tat_exon2 at 8375-8470 contains out of frame indels that impact 40 positions. +MN692074,DeletionInOrf,"Smaller ORF rev_exon2 at 8376-8651 can have maximum deletions 30, got 204" +MN692074,InsertionInOrf,"Smaller ORF nef at 8795-9415 can have maximum insertions 90, got 882" MN692074,RevResponseElementDeletion,Query Sequence exceeds maximum deletion tolerance in RRE. Contains 265 deletions with max tolerance of 20 deletions. MN692074,LongDeletion,Query sequence contains a long deletion. -MN090335,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 822 -MN090335,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 +MN090335,InternalStopInOrf,ORF gag at 789-2291 contains an internal stop codon at 822 +MN090335,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420 MN090335,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 42 deletions with max tolerance of 10 deletions. MN090335,MajorSpliceDonorSiteMutated,"Query sequence has a mutated splice donor site, AT." MN090335,Scramble,Sequence is minus-scrambled. MN090335,InternalInversion,Sequence contains an internal inversion. -MN090376,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 822 +MN090376,InternalStopInOrf,ORF gag at 789-2291 contains an internal stop codon at 822 MN090376,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 95 deletions with max tolerance of 10 deletions. MN090376,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." MN090376,Scramble,Sequence is minus-scrambled. @@ -45,56 +45,56 @@ MK115514.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice dono MK115488.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." MK115030.1,Scramble,Sequence is minus-scrambled. MK115030.1,InternalInversion,Sequence contains an internal inversion. -MK115211.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6889 +MK115211.1,InternalStopInOrf,ORF env at 6223-8793 contains an internal stop codon at 6889 MK115211.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 20 deletions with max tolerance of 10 deletions. MK115211.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." MK115211.1,Scramble,Sequence is minus-scrambled. MK115211.1,InternalInversion,Sequence contains an internal inversion. MK115158.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 20 deletions with max tolerance of 10 deletions. MK115158.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." -MK114705.1,DeletionInOrf,"Smaller ORF nef at 8795-9416 can have maximum deletions 30, got 186" -MK114856.1,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 873 -MK114856.1,InternalStopInOrf,ORF pol at 2084-5096 contains an internal stop codon at 2213 -MK114856.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6325 -MK114856.1,InternalStopInOrf,Smaller ORF vif at 5040-5619 contains an internal stop codon at 5172 -MK114856.1,InternalStopInOrf,Smaller ORF vpr at 5558-5849 contains an internal stop codon at 5594 -MK114856.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5919 -MK114856.1,InternalStopInOrf,Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126 -MK114856.1,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 -MK114856.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433 -MK114856.1,InternalStopInOrf,Smaller ORF nef at 8795-9416 contains an internal stop codon at 8852 +MK114705.1,DeletionInOrf,"Smaller ORF nef at 8795-9415 can have maximum deletions 30, got 186" +MK114856.1,InternalStopInOrf,ORF gag at 789-2291 contains an internal stop codon at 873 +MK114856.1,InternalStopInOrf,ORF pol at 2084-5095 contains an internal stop codon at 2213 +MK114856.1,InternalStopInOrf,ORF env at 6223-8793 contains an internal stop codon at 6325 +MK114856.1,InternalStopInOrf,Smaller ORF vif at 5040-5618 contains an internal stop codon at 5172 +MK114856.1,InternalStopInOrf,Smaller ORF vpr at 5558-5848 contains an internal stop codon at 5594 +MK114856.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5919 +MK114856.1,InternalStopInOrf,Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6126 +MK114856.1,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420 +MK114856.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8376-8651 contains an internal stop codon at 8433 +MK114856.1,InternalStopInOrf,Smaller ORF nef at 8795-9415 contains an internal stop codon at 8852 MK114856.1,APOBECHypermutationDetected,Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 3.639064030015132e-65). -MK115009.1,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 834 -MK115009.1,InternalStopInOrf,ORF pol at 2084-5096 contains an internal stop codon at 2183 -MK115009.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6349 -MK115009.1,InternalStopInOrf,Smaller ORF vif at 5040-5619 contains an internal stop codon at 5373 -MK115009.1,InternalStopInOrf,Smaller ORF vpr at 5558-5849 contains an internal stop codon at 5717 -MK115009.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5859 -MK115009.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433 -MK115009.1,InternalStopInOrf,Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873 +MK115009.1,InternalStopInOrf,ORF gag at 789-2291 contains an internal stop codon at 834 +MK115009.1,InternalStopInOrf,ORF pol at 2084-5095 contains an internal stop codon at 2183 +MK115009.1,InternalStopInOrf,ORF env at 6223-8793 contains an internal stop codon at 6349 +MK115009.1,InternalStopInOrf,Smaller ORF vif at 5040-5618 contains an internal stop codon at 5373 +MK115009.1,InternalStopInOrf,Smaller ORF vpr at 5558-5848 contains an internal stop codon at 5717 +MK115009.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5859 +MK115009.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8376-8651 contains an internal stop codon at 8433 +MK115009.1,InternalStopInOrf,Smaller ORF nef at 8795-9415 contains an internal stop codon at 8873 MK115009.1,APOBECHypermutationDetected,Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 1.2040967664149076e-41). MK115009.1,Scramble,Sequence is minus-scrambled. MK115009.1,InternalInversion,Sequence contains an internal inversion. -MK115387.1,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 -MK116110.1,InternalStopInOrf,ORF gag at 140-1643 contains an internal stop codon at 185 +MK115387.1,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420 +MK116110.1,InternalStopInOrf,ORF gag at 140-1642 contains an internal stop codon at 185 MK116110.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 22 deletions with max tolerance of 10 deletions. MK116110.1,MajorSpliceDonorSiteMutated,"Query sequence has a mutated splice donor site, CC." -MK114997.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6511 +MK114997.1,InternalStopInOrf,ORF env at 6223-8793 contains an internal stop codon at 6511 MK115065.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 75 deletions with max tolerance of 10 deletions. MK115065.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." MK115065.1,Scramble,Sequence is plus-scrambled. MK115065.1,InternalInversion,Sequence contains an internal inversion. -MK115464.1,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 924 -MK115464.1,InternalStopInOrf,ORF pol at 2084-5096 contains an internal stop codon at 2183 -MK115464.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6424 -MK115464.1,InternalStopInOrf,Smaller ORF vif at 5040-5619 contains an internal stop codon at 5247 -MK115464.1,FrameshiftInOrf,Smaller ORF tat_exon1 at 5829-6045 contains out of frame indels that impact 104 positions. -MK115464.1,InternalStopInOrf,Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126 -MK115464.1,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 -MK115464.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433 -MK115464.1,InternalStopInOrf,Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873 +MK115464.1,InternalStopInOrf,ORF gag at 789-2291 contains an internal stop codon at 924 +MK115464.1,InternalStopInOrf,ORF pol at 2084-5095 contains an internal stop codon at 2183 +MK115464.1,InternalStopInOrf,ORF env at 6223-8793 contains an internal stop codon at 6424 +MK115464.1,InternalStopInOrf,Smaller ORF vif at 5040-5618 contains an internal stop codon at 5247 +MK115464.1,FrameshiftInOrf,Smaller ORF tat_exon1 at 5829-6044 contains out of frame indels that impact 104 positions. +MK115464.1,InternalStopInOrf,Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6126 +MK115464.1,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420 +MK115464.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8376-8651 contains an internal stop codon at 8433 +MK115464.1,InternalStopInOrf,Smaller ORF nef at 8795-9415 contains an internal stop codon at 8873 MK115464.1,APOBECHypermutationDetected,Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 4.937891251407691e-23). -MK115520.1,InternalStopInOrf,ORF pol at 2084-5096 contains an internal stop codon at 2198 +MK115520.1,InternalStopInOrf,ORF pol at 2084-5095 contains an internal stop codon at 2198 MK115520.1,MajorSpliceDonorSiteMutated,"Query sequence has a mutated splice donor site, GA." MK115520.1,InternalInversion,Sequence contains an internal inversion. MK115570.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 11 deletions with max tolerance of 10 deletions. @@ -103,14 +103,14 @@ MK115702.1,PackagingSignalDeletion,Query Sequence exceeds maximum deletion toler MK115702.1,MajorSpliceDonorSiteMutated,"Query sequence has a missing splice donor site, --." MK115702.1,Scramble,Sequence is plus-scrambled. MK115702.1,InternalInversion,Sequence contains an internal inversion. -MK115095.1,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 927 -MK115095.1,InternalStopInOrf,ORF pol at 2084-5096 contains an internal stop codon at 2183 -MK115095.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6550 -MK115095.1,InternalStopInOrf,Smaller ORF vif at 5040-5619 contains an internal stop codon at 5151 -MK115095.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5859 -MK115095.1,InternalStopInOrf,Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126 -MK115095.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433 -MK115095.1,InternalStopInOrf,Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873 +MK115095.1,InternalStopInOrf,ORF gag at 789-2291 contains an internal stop codon at 927 +MK115095.1,InternalStopInOrf,ORF pol at 2084-5095 contains an internal stop codon at 2183 +MK115095.1,InternalStopInOrf,ORF env at 6223-8793 contains an internal stop codon at 6550 +MK115095.1,InternalStopInOrf,Smaller ORF vif at 5040-5618 contains an internal stop codon at 5151 +MK115095.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5859 +MK115095.1,InternalStopInOrf,Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6126 +MK115095.1,InternalStopInOrf,Smaller ORF rev_exon2 at 8376-8651 contains an internal stop codon at 8433 +MK115095.1,InternalStopInOrf,Smaller ORF nef at 8795-9415 contains an internal stop codon at 8873 MK115095.1,APOBECHypermutationDetected,Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 8.33506116803153e-40). OQ092466,MajorSpliceDonorSiteMutated,"Query sequence has a mutated splice donor site, GC." OQ092463,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 26 deletions with max tolerance of 10 deletions. diff --git a/tests/expected-results-large-csv/holistic.csv b/tests/expected-results-large-csv/holistic.csv index 86f159e..26dee0c 100644 --- a/tests/expected-results-large-csv/holistic.csv +++ b/tests/expected-results-large-csv/holistic.csv @@ -1,42 +1,42 @@ seqid,qlen,hypermutation_probablility,inferred_subtype,blast_matched_qlen,blast_sseq_coverage,blast_qseq_coverage,blast_sseq_orfs_coverage,orfs_start,orfs_end,blast_n_conseqs -KX505501.1,1997,0.7087072014754221,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,1997,0.2498456472525211,1.2158237356034052,0.17663960024984385,789,8794,4 -MN691959,9493,0.19667690182893238,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9493,1.0817040543321672,1.1086063415148004,1.0,789,8794,3 -MN692074,4178,0.36378645339477633,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,4178,0.5042189750977567,1.1728099569171853,0.4114928169893816,789,8794,4 -MN692145,9689,0.1672411051048176,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.130479522535501,1.1271545051088863,1.0,789,8794,3 -MN090335,9069,0.1771850809736527,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9069,0.9842560197571517,1.0603153600176425,1.0003747657713928,789,8794,3 -MN090376,8985,0.026415767987601813,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,8985,0.9784935171846059,1.0604340567612687,0.9943785134291068,789,8794,3 -MK115581.1,9495,0.6919440876652894,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9495,0.987034369211772,1.0046340179041602,1.0,789,8794,2 -MK115690.1,9689,0.051230576250981485,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.004630582424367,1.0113530808132933,1.0,789,8794,3 -MK115571.1,9394,0.8029570594372466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9394,0.9866227618851615,1.0113902490951672,1.0,789,8794,2 -MK115514.1,9382,0.6482462132632603,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9382,0.9864169582218564,1.0173736943082499,1.0,789,8794,2 -MK115488.1,9623,0.6534999185838631,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9623,1.0255196542498457,1.0325262392185388,1.0,789,8794,6 -MK115030.1,9126,0.032014462397289556,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9126,0.994031693764149,1.0655270655270654,1.0,789,8794,3 -MK115498.1,9461,0.83547963060225,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9461,0.9866227618851615,1.0080329774865235,1.0,789,8794,2 -MK115211.1,9032,0.11818291879607423,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9032,0.995060712080675,1.0598981399468557,1.0,789,8794,3 -MK115158.1,9143,0.002572269807584293,Ref.47_BF.ES.08.P1942.GQ372987,9143,0.9921577414295317,0.9699223449633599,1.0,234,8212,1 -MK114705.1,9411,0.14584270737492833,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9411,1.098065445564931,1.122622463075125,1.0,789,8794,6 -MK114856.1,9477,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9477,1.0485696645400289,1.0812493405085997,1.0,789,8794,4 -MK115009.1,9207,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9207,0.9965013377238114,1.0590854784403172,1.0,789,8794,3 -MK115387.1,9136,0.5436355526687852,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9136,0.9796254373327845,1.040936952714536,1.0,789,8794,2 -MK115491.1,9422,0.8961809048805741,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9422,1.0037044659394938,1.0299299511780937,1.0,789,8794,2 -MK116110.1,8967,0.07021438897893317,Ref.B.TH.90.BK132.AY173951,8967,0.9957759004001778,0.9972119995539199,0.998622244488978,140,8124,3 -MK115527.1,9481,0.770862998910788,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9481,0.9867256637168141,1.0056956017297753,1.0,789,8794,2 -MK114997.1,9055,0.05560625344150194,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9055,0.9784935171846059,1.0516841524019878,1.0,789,8794,2 -MK115518.1,9537,0.6408152618300496,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9537,0.9847705289154147,0.9996854356715948,1.0,789,8794,3 -MK115065.1,9214,0.033954952452739495,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9214,1.0080263428689031,1.069459518124593,1.0,789,8794,6 -MK115464.1,9663,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9663,0.9838444124305412,0.9893407844354756,1.0,789,8794,2 -MK115530.1,9544,0.5812621948015355,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9544,0.9866227618851615,0.9992665549036044,1.0,789,8794,2 -MK115520.1,9589,0.5225247969864292,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9589,0.9786993208479111,0.987902805297737,1.0121174266083697,789,8794,3 -MK115503.1,9617,0.42870398270204335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9617,0.987034369211772,0.9953207861079338,1.0,789,8794,2 -MK115570.1,9485,0.7406166892211931,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9485,0.9866227618851615,1.0057986294148655,1.0,789,8794,2 -MK115509.1,9353,0.7883768413537747,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9353,0.9866227618851615,1.0197797498128942,1.0,789,8794,2 -MK115702.1,9098,0.1454272422215308,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9098,0.9874459765383824,1.0596834469114091,1.0198625858838226,789,8794,4 -MK115095.1,9137,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9137,0.9907388351512657,1.060085367188355,1.0,789,8794,2 -MK115490.1,9347,0.8875203448314265,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9347,0.9848734307470673,1.0204343639670483,1.0,789,8794,3 -MK115576.1,9266,0.8197662757563093,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9266,0.9917678534677917,1.0342110943233327,1.0,789,8794,3 -OQ092466,9686,0.3858261890626,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9686,1.1015641078411196,1.1192442700805285,1.0,789,8794,3 -OQ092463,9605,0.21628713708846803,Ref.B.TH.90.BK132.AY173951,9605,1.0529124055135617,0.9884435190005205,1.0,140,8124,2 -OQ092465,9659,0.02412789935966586,Ref.28_BF.BR.99.BREPM12817.DQ085874,9659,1.0429696287964005,0.9620043482762191,1.0,200,8208,2 -OQ092462,9714,0.10883643311676816,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9714,1.1306853261988064,1.1301214741610048,1.0,789,8794,3 -OQ092464,9556,0.006887768010151674,Ref.28_BF.BR.99.BREPM12817.DQ085874,9556,1.0427446569178853,0.9678735872750105,1.0,200,8208,2 -OQ092467,9936,0.6438715160567257,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9936,1.1308911298621116,1.0962157809983897,1.0,789,8794,3 +KX505501.1,1997,0.7087072014754221,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,1997,0.2498456472525211,1.2158237356034052,0.17666166916541728,789,8793,4 +MN691959,9493,0.19667690182893238,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9493,1.0817040543321672,1.1086063415148004,1.0,789,8793,3 +MN692074,4178,0.36378645339477633,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,4178,0.5042189750977567,1.1728099569171853,0.411544227886057,789,8793,4 +MN692145,9689,0.1672411051048176,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.130479522535501,1.1271545051088863,1.0,789,8793,3 +MN090335,9069,0.1771850809736527,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9069,0.9842560197571517,1.0603153600176425,1.000374812593703,789,8793,3 +MN090376,8985,0.026415767987601813,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,8985,0.9784935171846059,1.0604340567612687,0.9943778110944528,789,8793,3 +MK115581.1,9495,0.6919440876652894,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9495,0.987034369211772,1.0046340179041602,1.0,789,8793,2 +MK115690.1,9689,0.051230576250981485,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.004630582424367,1.0113530808132933,1.0,789,8793,3 +MK115571.1,9394,0.8029570594372466,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9394,0.9866227618851615,1.0113902490951672,1.0,789,8793,2 +MK115514.1,9382,0.6482462132632603,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9382,0.9864169582218564,1.0173736943082499,1.0,789,8793,2 +MK115488.1,9623,0.6534999185838631,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9623,1.0255196542498457,1.0325262392185388,1.0,789,8793,6 +MK115030.1,9126,0.032014462397289556,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9126,0.994031693764149,1.0655270655270654,1.0,789,8793,3 +MK115498.1,9461,0.83547963060225,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9461,0.9866227618851615,1.0080329774865235,1.0,789,8793,2 +MK115211.1,9032,0.11818291879607423,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9032,0.995060712080675,1.0598981399468557,1.0,789,8793,3 +MK115158.1,9143,0.002572269807584293,Ref.47_BF.ES.08.P1942.GQ372987,9143,0.9921577414295317,0.9699223449633599,1.0,234,8211,1 +MK114705.1,9411,0.14584270737492833,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9411,1.098065445564931,1.122622463075125,1.0,789,8793,6 +MK114856.1,9477,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9477,1.0485696645400289,1.0812493405085997,1.0,789,8793,4 +MK115009.1,9207,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9207,0.9965013377238114,1.0590854784403172,1.0,789,8793,3 +MK115387.1,9136,0.5436355526687852,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9136,0.9796254373327845,1.040936952714536,1.0,789,8793,2 +MK115491.1,9422,0.8961809048805741,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9422,1.0037044659394938,1.0299299511780937,1.0,789,8793,2 +MK116110.1,8967,0.07021438897893317,Ref.B.TH.90.BK132.AY173951,8967,0.9957759004001778,0.9972119995539199,0.9986220719027934,140,8123,3 +MK115527.1,9481,0.770862998910788,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9481,0.9867256637168141,1.0056956017297753,1.0,789,8793,2 +MK114997.1,9055,0.05560625344150194,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9055,0.9784935171846059,1.0516841524019878,1.0,789,8793,2 +MK115518.1,9537,0.6408152618300496,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9537,0.9847705289154147,0.9996854356715948,1.0,789,8793,3 +MK115065.1,9214,0.033954952452739495,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9214,1.0080263428689031,1.069459518124593,1.0,789,8793,6 +MK115464.1,9663,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9663,0.9838444124305412,0.9893407844354756,1.0,789,8793,2 +MK115530.1,9544,0.5812621948015355,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9544,0.9866227618851615,0.9992665549036044,1.0,789,8793,2 +MK115520.1,9589,0.5225247969864292,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9589,0.9786993208479111,0.987902805297737,1.012118940529735,789,8793,3 +MK115503.1,9617,0.42870398270204335,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9617,0.987034369211772,0.9953207861079338,1.0,789,8793,2 +MK115570.1,9485,0.7406166892211931,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9485,0.9866227618851615,1.0057986294148655,1.0,789,8793,2 +MK115509.1,9353,0.7883768413537747,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9353,0.9866227618851615,1.0197797498128942,1.0,789,8793,2 +MK115702.1,9098,0.1454272422215308,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9098,0.9874459765383824,1.0596834469114091,1.0198650674662668,789,8793,4 +MK115095.1,9137,1.0,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9137,0.9907388351512657,1.060085367188355,1.0,789,8793,2 +MK115490.1,9347,0.8875203448314265,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9347,0.9848734307470673,1.0204343639670483,1.0,789,8793,3 +MK115576.1,9266,0.8197662757563093,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9266,0.9917678534677917,1.0342110943233327,1.0,789,8793,3 +OQ092466,9686,0.3858261890626,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9686,1.1015641078411196,1.1192442700805285,1.0,789,8793,3 +OQ092463,9605,0.21628713708846803,Ref.B.TH.90.BK132.AY173951,9605,1.0529124055135617,0.9884435190005205,1.0,140,8123,2 +OQ092465,9659,0.02412789935966586,Ref.28_BF.BR.99.BREPM12817.DQ085874,9659,1.0429696287964005,0.9620043482762191,1.0,200,8207,2 +OQ092462,9714,0.10883643311676816,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9714,1.1306853261988064,1.1301214741610048,1.0,789,8793,3 +OQ092464,9556,0.006887768010151674,Ref.28_BF.BR.99.BREPM12817.DQ085874,9556,1.0427446569178853,0.9678735872750105,1.0,200,8207,2 +OQ092467,9936,0.6438715160567257,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9936,1.1308911298621116,1.0962157809983897,1.0,789,8793,3 diff --git a/tests/expected-results-large-csv/orfs.csv b/tests/expected-results-large-csv/orfs.csv index e886aad..0f44643 100644 --- a/tests/expected-results-large-csv/orfs.csv +++ b/tests/expected-results-large-csv/orfs.csv @@ -1,452 +1,452 @@ seqid,name,start,end,subtype_start,subtype_end,orientation,distance,protein,aminoacids,nucleotides -KX505501.1,env,0,1824,6223,8794,forward,0.7623480451210163,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,vif,0,1824,5040,5619,forward,0.7647696476964769,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,nef,0,1824,8795,9416,forward,0.764345579086969,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,tat_exon1,1,1750,5829,6045,forward,0.7680130480667754,MRKLQNGIDCIQCMQGLLHQAR,VSLVRPDLSLGALWLTREPTA*ASIKLALSASSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKGKPEELSRRRTRLAERAQQEARGGDW*VRRKFFD*RRLEGERWVRERQY*AGENWIDGKKFG*GQEEIKDIN*NI*YGQAES*NDSQLILAC*KHQKAVDKYWDSYNRLLRQDQKNLSLCIIQ*QSSIVYIKK*M*KTPRKP*TR*KKSKTKLGNKHSKPQLQEVAVRSATITL*CRIIRGKWYIRPCHQEL*MHG*K**RKRLSAQK*YPCFQHYQKEPPHKT*TPC*IQWGDIKQPCKC*KRPLMRKLQNGIDCIQCMQGLLHQAR*ENQGEVT*QELLVPFRNK*HG*QIIHLSQ*ERFIKDG*S*G*IK**ECIALSAFWT*DKDQRNLLETM*TGSIKP*EPNKPHRK*KIG*QKPCWSRMRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,GTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT -KX505501.1,gag,336,1824,789,2292,forward,0.3997973809613161,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,rev_exon1,1306,1750,5968,6046,forward,0.758082497212932,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,ATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT -KX505501.1,vpr,1599,1824,5558,5849,forward,0.763687959047407,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,vpu,1599,1824,6060,6309,forward,0.7672672672672673,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,pol,1627,1927,2084,5096,forward,0.7724330674761569,GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,IL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,ATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA -KX505501.1,tat_exon2,1746,1824,8375,8471,forward,0.7616257781032589,RCIRSTTRTADTELFTRDFPLGTFQ,RCIRSTTRTADTELFTRDFPLGTFQ*,AGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,rev_exon2,1747,1927,8376,8652,forward,0.7620186257236345,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA -MN691959,gag,639,2142,789,2292,forward,0.0801186943620179,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATCGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGAGAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGACACAGCAACCAGATCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAGTGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCYWYCTWTCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAAGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCWGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGAGTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA -MN691959,pol,1934,4946,2084,5096,forward,0.054722889368558514,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAGCTGAGACAACATCTGTTGAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAGAGCATTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGTATAGTAATATGGGGAAAGACTCCTAGATTTAAACTACCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCTTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGGTATGTTACTAACAAAGGAAGACAAAAGGTTGTCCCCCTAACTAACACAACAAATCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATCAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAATACTATTTTTAGATGGAATAGATAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATATTTTCTTTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MN691959,vif,4890,5469,5040,5619,forward,0.09157509157509158,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAGGGGATGGTTTTATAGACATCACTATGAAAGAACTCATCCAAGAATAAGTTCAGAAGTATACATCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTACTTTGACTGTTTTTCAGACTCTGCTATAAGAAAGGCCTTATTAGGACATATAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAG -MN691959,vpr,5408,5699,5558,5849,forward,0.09157509157509158,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCAACAGAAGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MN691959,tat_exon1,5679,5898,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA -MN691959,rev_exon1,5818,5899,5968,6046,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKFLYQSSK,MAGRSGDSDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG -MN691959,vpu,5910,6156,6060,6309,forward,0.7333193453629878,MQPIQIAIVALVVAIIIAIVV,MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL*,ATGCAACCTATACAAATAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGATCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG -MN691959,env,6070,8656,6223,8794,forward,0.1405525502318391,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*,ATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATGCAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGGGGAATGCTACTAATACCAATAGTAGTAATACCAATAGTAGTAGCGGGGAAATGATGATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAAATAAGGTGCAGAAAGAATATGCATTCTTTTATAAACTTGATATAGTACCAATAGATAATGATACTACCAGCTATACGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGATGTAGTAATTAGATCTGCCAATTTCACAGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGCCACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACACTCCCATGCAGAATAAAACAATTTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGCGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAACAACAATGGGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATAACATGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTATAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAA -MN691959,tat_exon2,8237,8333,8375,8471,forward,0.6672629695885509,RPTSQTRGDPTGPKE,RPTSQTRGDPTGPKE*KKKVERETETDPFD**,AGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGA -MN691959,rev_exon2,8238,8514,8376,8652,forward,0.210025203024363,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE*,GACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAG -MN691959,nef,8657,9278,8795,9416,forward,0.06582796957284964,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA -MN692074,nef,0,4059,8795,9416,forward,0.7628009106462086,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,WKG*FGPRKDKISLICGSTTHKATSLIGRTTHQGRGPDFH*PLDGASS*YQLIQRR*KRPMQERTTACYTL*ACMGWRTRRKKC*CGSLTAA*HFITWPESCIRSTTRIADFELSTRDFPLGTFQGGVAWAGLGSGEPSDAAYKQLLFACTGSLWLDQI*AWELSG*LGNPLLKPQ*SLP*VL*VVCARLLCDSGN*RSLRPF*SVWKISSSGARTGT*KRKRNQRSSLDAGLGLLKRARQEARGGDW*VRQKF*LAEARRREMGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*G*GGN*RKLY*IQEQMIQY*KK*ICQEDGNQK**GELEVLSK*DSMIRYS*KSVDIKL*VQY**DLHLST*LEEIC*LRLVAL*IFPLVLLKLYQ*N*SQEWMAQKLNNGH*QKKK*KH**KFVQKWKRKGKFQKLGLKIHTILQYLP*RKKTVLNGEN**ISENLIRELKTSGKFN*EYHIPQG*ERKNQ*QYWMWGMHIFQFP*IKNLGNILHLPYPVETMRHQGLDISTMCFHRDGKDHQQYSKVA*QKF*SLLENKIQK*LSINTWMIYM*DLI*K*GSIE*K*RN*DNIC*DGDLPHQTKNIRKNPHSFGWVMNSILINGQYSL*CCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QK*YH*QKKQSWNWQKTGKF*KNQYMEYIMTHQKT**QKYRSRGKVNGHIKFIKSHLKI*KQENMQK*GVPTLMM*NN*QRQCKK*PQKA**YGERLLNLNYPYKKKHGKHGGQSIGKPPGFLSGSLSIPLP**NYGTS*RKNP**EQKPSM*MGQLTGRLN*EKQDMLLTEEDKKLSP*LTQQIRRLNYKQFI*LCRIRD*K*T**QTHNMH*,TGGAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAG -MN692074,env,2,4115,6223,8794,forward,0.76033143808071,MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,gag,789,2292,789,2292,forward,0.19470123431286457,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA -MN692074,pol,2084,4115,2084,5096,forward,0.5617851221088768,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,vif,3617,4115,5040,5619,forward,0.7631664499349805,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,vpr,3617,4115,5558,5849,forward,0.7629151983204618,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,vpu,3617,4115,6060,6309,forward,0.7634058115037564,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,tat_exon1,3823,4084,5829,6045,forward,0.7659115426105717,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC -MN692074,rev_exon1,3823,4084,5968,6046,forward,0.7610789980732178,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC -MN692074,tat_exon2,4080,4164,8375,8471,forward,0.769292994661058,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA -MN692074,rev_exon2,4081,4153,8376,8652,forward,0.7667894365645325,YPVASPQMLHISSCFLPVLGLSG,YPVASPQMLHISSCFLPVLGLSG*,TACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAG -MN692145,gag,775,2281,789,2292,forward,0.20784453738651432,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGAACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGGACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGATAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACACAGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAATGGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAAAACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA -MN692145,pol,2070,5085,2084,5096,forward,0.14843087362171337,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGGACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATACCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATCAAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACTGGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MN692145,vif,5029,5608,5040,5619,forward,0.2608047690014903,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTATGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGACCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCATATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCCTAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAG -MN692145,vpr,5547,5838,5558,5849,forward,0.3566796368352788,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG -MN692145,tat_exon1,5818,6037,5829,6045,forward,0.28735632183908044,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA -MN692145,rev_exon1,5957,6038,5968,6046,forward,0.4274965800273598,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG -MN692145,vpu,6049,6298,6060,6309,forward,0.520618556701031,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*,ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG -MN692145,env,6212,8783,6223,8794,forward,0.4766895145301081,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA -MN692145,tat_exon2,8364,8460,8375,8471,forward,0.3921568627450981,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -MN692145,rev_exon2,8365,8641,8376,8652,forward,0.29843322556577967,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG -MN692145,nef,8784,9387,8795,9416,forward,0.3966849799795139,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA -MN090335,gag,315,1665,789,2292,forward,0.596665989022159,MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ,MYTIEGGYCII**SKFF*SCLKGWL*LFQYLFTAS*CF*QARINCESF*FPACPYYMF*SIFFLSPWP*PNFLPSI*FSPAQY*RSRTHLSPSSLR*SKMAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ*,ATGTACACAATAGAGGGTGGCTACTGTATTATATAATGATCTAAGTTCTTCTGATCCTGTCTGAAGGGATGGTTGTAGCTGTTCCAATATCTGTTTACAGCCTCCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGTTCCCTGCTTGCCCATACTATATGTTTTAATCTATATTTTTTCTTTCCCCCTGGCCTTAACCGAATTTTCTCCCATCTATCTAATTCTCCCCCGCTCAATACTGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGTCAAAAATGGCGTACTCACCAGTCGCCGCCCCTCGCCTCTTGCCGTGCGCGCTTCAGCAAGCCACCCCACAAGATTTGAACACTATGCTAAACACAGTGGGTGGACACCAAGCAGCTATGCAAATGTTAAAAGAGGTCATCAATGAGGAAGCTGCAGAATGGGATAGATTACATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATTCTGGGACTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAGCAAGGGCCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTTTAAGAGCCGAGCAAGCTACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAATCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGCAACAGGTACAGCCAACATACTGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGCCTGTTAAATGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAGGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAA -MN090335,pol,1427,4469,2084,5096,forward,0.27887169154684477,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAGGACATAGATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAATATGAACAGGTACCCATAGAAATTAGCGGACACAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGCACTCTAAATTTTCCCATCAGCCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGACGGCCCAAAGGTTAAACAATGGCCATTAACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTGTTTGCCATAAAGAAAAAAGATGGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGAATTCTGGGAAATTCAATTAGGTATACCACATCCTGCAGGGCTAAAAAAGAAAAAATCAGTCACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTATAATGTGCTTCCACAAGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAGATCCTGGAGCCTTTTAGAAAGACAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAACATAGAACAAAAGTAGAGGAACTGAGGCAACATCTGATGAGGTGGGGATTTACCACACCAGACAAAAAGCACCAGAAAGAACCCCCATTCCTTTGGATGGGGTATGAACTCCATCCTAATAAATGGACAGTACAGCCTATAGTACTGCCAGAAAAGGAAAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTGAAGCAATTATGTAAGCTCCTTAGGGGAACCAAAGCATTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGATCCGGTACATGGAGCATATTATGACCCAGCAAAGGACTTAATAGCAGAACTACAGAAGCAGGGAGAAGGTCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCATACTAATGATGTAAAGCAATTAACAGAGGCAGTGCAAAAAATATCCACAGAAAGTATAGTAATATGGGGAAGGACTCCTAAATTTAGATTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGATTATTGGCAAGCCACCTGGATCCCTGAGTGGGAGTTTGTCAACACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAATAGGGATAATAAATCAGGAAAAGCAGGATATGTTACTGATAGAGGAAGACAAAAGGTTGTCACCATAAATGACACAACAAATCAGAAAACTGAATTACAAGCCATTCATCTAGCCTTGCAGGATTCGGGGCTAGAAGTAAACATAGTAACAGACTCACAGTATGCATTAGGGATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTAATAAAAAAGGAAAAGGTCTACCTGGCATGGGTGCCAGCCCACAAAGGAATTGGAGGAAATGAACAGGTAGATAAACTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGAAAAAGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAACAATGGCTAGTGATTTTAACCTACCACCTATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGGCAAGTAGACTGTAGTCCAGGTATATGGCAGCTAGATTGTACACATTTAGAAGAAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTGATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTATTTTAAAACTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCCGCAATTTCACCAGTAATACAGTGAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGTATTCCCTACAATCCCCAGAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGATACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCCAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MN090335,vif,4413,4992,5040,5619,forward,0.3566796368352788,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAAAAATGGGCTTATAGACACCATTACGAAACCACTCATCCAAGAATAAGTTCAGAAGTACATATCCCACTAGGGGATGATAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAGAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAACAGCAGTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG -MN090335,vpr,4931,5222,5558,5849,forward,0.3808935556928146,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAGACCTAGGACAATATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATGGAGCCAGTAGATCATAG -MN090335,tat_exon1,5202,5421,5829,6045,forward,0.40192926045016075,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ*,ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAA -MN090335,rev_exon1,5341,5422,5968,6046,forward,0.524971623155505,MAGRSGDRDEDLLKTVRLIKFLYQSSK,MAGRSGDRDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAG -MN090335,vpu,5433,5682,6060,6309,forward,0.5244381020335356,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL*,ATGCAATCTTTAGAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTAGGCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAAAATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG -MN090335,env,5596,8158,6223,8794,forward,0.5152420275849952,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*,ATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTGGACCAGATGCATGAGGATATAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAGAAATGATACTGTAGGAAATCAAACAAATCTCACTGAAACTAATACAATACAGGGAAGAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAACATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAGGGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTGGTTTTGCAATTCTAAAGTGTAAGGATGAGATGTTCAATGGAACAGGACCATGTAAGAATGTCAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTGTCAACTCAACTACTGTTAAATGGTAGCCTAGCAGAAAAAGAGATAGTACTTAGATCTGAAAATTTCACAGACAATGGTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAGGGAGAGCAATTTATGCAACAGGGCAGATAATAGGAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGGAATGACACTTTAAGCAAAATAGTTGAAAAATTAAGGGAAAAATTTGGAAAAGATAAAACAATAATCTTTAATCAATCATCAGGAGGGGACATGGAAATTGAAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGGAGTGTTAATGGAACTAGCATAAACGGAACTAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATAAACAGGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCTATCAGTGGGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATGGTGGTACAAATAATAGTACAGAGGAGACGGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAAGGCACAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAGCGTTAGGAGCTATGTTCCTCGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCACTGACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGCAATAAATCTTACGATACCATCTGGGATAACATGACCTGGATGCAGTGGGACAGAGAAATTCAAAATTACACAGGGAAAATATACAACTTACTTGAGGAATCGCAAATCCAACAGGAAAAGAATGAAAAGGAATTATTAGAACTAGATCAATGGGCAAATTTGTGGAATTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAGGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAGGGAACAGATAGGGTTATAGAGGTAGGACAAAGAATTGGCAGAGCTTTTCTCCACATACCTAGAAGGATAAGACAGGGATTAGAAAGGGCTTTGCAATAA -MN090335,tat_exon2,7739,7835,8375,8471,forward,0.6842105263157894,RPSSQPRGDQTGPKE,RPSSQPRGDQTGPKE*KKKVERETEADPED**,AGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGA -MN090335,rev_exon2,7740,8016,8376,8652,forward,0.4267425320056898,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE*,GACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAG -MN090335,nef,8159,8813,8795,9416,forward,0.4891015417331206,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAGGTTGTATGGCTGGATGGCCTACTGTAAGGGAAAGAATGGAAAGAATTGATCCAAGGCCTGCTGCAAGGAGGGAACAAGCTGAGCCAGCAGCAGCTGGGGTAGGAGCAGCATCTCGAGACTTGGAAAAATATGGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAAGTAGGCTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTGGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA -MN090376,gag,522,1590,789,2292,forward,0.6828741441147701,MYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP,MHTIEDCYCIK**FKFL*SCLKCWL*LSQYLSTAF*CF*QARINCESFQFPACPYYMF*LISFLSPWP*PNFLPFV*FSPA*YRRSRTHLSPSSLR*SKRRTHRSPPLASCCARFSKPSPIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP*SQ*,ATGCACACAATAGAGGACTGCTACTGTATTAAATAATGATTTAAGTTCCTCTGATCCTGTCTGAAGTGCTGGTTGTAGCTGTCCCAGTATTTGTCTACAGCCTTCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCCAGTTCCCTGCTTGCCCATACTATATGTTTTAACTTATATCTTTTCTTTCCCCCTGGCCTTAACCGAATTTTCTCCCATTTGTCTAATTCTCCCCCGCTTAATACCGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGTCAAAAAGGCGTACTCACCGTTCGCCGCCCCTCGCCTCTTGCTGTGCGCGCTTCAGCAAGCCGAGTCCGATAATTCTGGGATTAAATAAAATAGTAAGAATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAACCCAGATTGTAAGACCATTTTAAAAGCATTGGGTCCAGCAGCTACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAACTCAGCTTCCGTGATGATGCAGAAAGGCAATTTTAGGAGCCAAAGAAAGATGGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCAAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAGAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAA -MN090376,pol,1382,4394,2084,5096,forward,0.23966680468616797,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAGAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTGTTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGCTTTATCAAAGTAAAACAGTATGATCAGATATCAGTAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAATATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAGGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAGTTAGTAGATTTTAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCCTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTACTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAGTAGAGGAACTGAGACAACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAACTGCCAGAGAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAGTTGAATTGGGCAAGTCAGATTTATCCAGGGATTAAAGTAAGGCAGTTATGTAAACTACTTAGAGGAGCCAAGGCGCTGACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATCCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAACTTGAAAACAGGAAAATATGCAAGAACAAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATTCAAAAAGAAACATGGGAATCATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAGACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACAAAATCAGGAAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAAGTTATCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGATAAAAGCGAATCAGAGTTAGTCAATCAAATAATAGAGCAATTAATACAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGGGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGAAAGGTACTATTTTTGGATGGAATAGATAAAGCCCAAGATGAGCATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACATACCACCTGTAGTAGCAAAAGAAATAGTAGCCTGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCCCCAACTTCACCAGTAATGCAGTTAAGGCCGCCTGTTGGTGGGCAGGGGTCAAACAAGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTCGTAGAATCTATGAATAAACAATTAAAACAAATTATAGGACAGGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAGGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTGGTAATACAAGATAATAGTGACATAAAAGTAGTACCAAGAAGAAAAGCAAAAATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAG -MN090376,vif,4338,4920,5040,5619,forward,0.42479043044174425,MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAGCATGTGGAAAAGCTTAGTAAAATACCATATACATAATTCAGGGAAGGCTAGGGGATGGTGTTATAGACATCACTATGAAAGCAGACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGAGGAGAGGCTAGACTAGTAGTGACAACATATTGGGGACTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTATTTTAATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAATAAGGTAGGATCTCTGCAGTACTTGGCACTAATAGCATTAATACCACCAAAAAGGAAAAAGCCACCTTTGCCTAGTGTGAGGAAACTGACAGAGGATAGATGGAAAGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG -MN090376,vpr,4859,5150,5558,5849,forward,0.36116422349691957,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*,ATGGAAAGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCTTGGCTTCATGGCCTAGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAATTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MN090376,tat_exon1,5130,5349,5829,6045,forward,0.46628407460545196,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAGGACTGCGTGCACCAGTTGCTATTGTAAAAAGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAGTAA -MN090376,rev_exon1,5269,5350,5968,6046,forward,0.5763097949886105,MAGRSGDSDEELLRIAGTIKFLYQSSK,MAGRSGDSDEELLRIAGTIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAGTAAG -MN090376,vpu,5361,5631,6060,6309,forward,0.5680096940321115,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL*,ATGCAATCTTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTCGTTTGGTCTATAGTACTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAA -MN090376,env,5524,8110,6223,8794,forward,0.49863720871464445,MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAATGCAGAGGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAGCCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACACAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTAACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTAACATCAATAGCACTAATATAAACAATACCAATAGTATAGAAAGAGAAATGACAAACTGCTCTTTTAATGTCACCACAGTCATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAAACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGCTATAGGTTGATAAATTGTAACTCCTCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAATTTCAATGGAACAGGACTATGTAAAAATGTTAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGAGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAACACAGAAGTAAATATTATCACACTCCCATGCAAGATAAGGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACATTTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTACATTTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGAAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA -MN090376,tat_exon2,7691,7784,8375,8471,forward,0.4464285714285715,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAG -MN090376,rev_exon2,7692,7968,8376,8652,forward,0.4267425320056898,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG -MN090376,nef,8111,8735,8795,9416,forward,0.5036770338593534,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACATCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACTCAGAGAGAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA -MK115581.1,gag,680,2180,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115581.1,pol,1972,4984,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115581.1,vif,4928,5507,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115581.1,vpr,5446,5737,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115581.1,tat_exon1,5717,5936,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115581.1,rev_exon1,5856,5937,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115581.1,vpu,5948,6194,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115581.1,env,6111,8652,6223,8794,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115581.1,tat_exon2,8233,8329,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115581.1,rev_exon2,8234,8510,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115581.1,nef,8653,9268,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK115690.1,gag,777,2286,789,2292,forward,0.24076694150363465,MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGACAAGTGGGAAAAAATTCGGTTGAGGCCAGGGGGAAAGAAAAAATATAGATTAAAGCATATCGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATAATGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTGTATAATACAGTAGCAACCCTCTATTGTGTACATCAAAGGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGGCGCAGGAAACAGCAGTCAGACCAGCACCAGCCAAAATTACCCTATAGTACAGAACATTCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTCTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTACATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACTAATAATCCACCTATCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCCACCAGCATTCTAGACATAAGACAAGGACCAAAGGAGCCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTAGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGTCCAGCAGCTACACTAGAGGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGTCATAAAGCAAGAGTTTTAGCGGAAGCAATGAGCCAAGCAACAAATTCAGCTGCCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAAAGTGTTAAGTGTTTTAATTGCGGCAAAGATGGGCACATAGCAAAAAATTGCAGGGCCCCTAGAAGAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTCCAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGAAGATAGACCAGGACCTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA -MK115690.1,pol,2078,5090,2084,5096,forward,0.185747174550021,FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGAAGATAGACCAGGACCTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGGTAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGACATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAAATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGCACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATAGGGCCTGAGAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGACTTCAGAGAACTAAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCCTATTTTTCAGTTCCCTTAGACAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAACCTTATAGAAAACAAAATCCAAACATAGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACCTAGAAATAGGGCAGCATAGAATAAAAATAGAAGAACTGAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGGTATGAACTCCATCCTGACAAGTGGACAGTACAGCCTATAGCGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAACTGGGCAAGTCAGATCTACCCAGGAATTAAAGTAAGGCAATTATGTAAACTACTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAAAAGAAGCAGAGCTAGAATTAGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGAGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTGACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTGATATGGGGAAAGACTCCTAAATTTAGACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAAACTAAATCAGGAAAAGCAGGATATGTTACTAATAGAGGAAGACAAAAAGTTATCCCCCTAACTGACACAACAAATCAGAAGACTGAGTTACATGCAATTTATCTAGCTTTGCAAGATTCGGGATTAGAAGTAAATATAGTAACAGACTCACAGTATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTGTTTTTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTCATTCCAGCAGAGACAGGGCAGGAAGCAGCATACTTTATTTTAAAATTAGCAGGACGATGGCCAGTAGCAACAATACATACAGACAATGGCAGCAATTTCACCAGTGCTACAGTTAAGGCCGCCTGCTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAACAATGAATTGAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACGTAATAGCAACAGACTTACAAACTAAAGAACTACAAAAACAAATTACAAAAATTCAACATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGAAATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115690.1,vif,5034,5613,5040,5619,forward,0.39766435115272314,MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH,MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAAGATGGCACAGTTTAGTAAAACACCATATATATATTTCAGGGAAAGCTAGAGGATGGGTTTATAAACATCACTATGAAAACACTCATCCAAGAATAAGTTCAAAAGTATACATCCCACTAGGGGAAGCTAGACTGGCAGTAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCACTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAAGGAATATAGCACACAAGTAGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGTCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTTTACAGTACTTGGCACTAACAGCATTAGTAACACCAAAAAAGACAAAGCCACCTTTGCCTAGTATTACGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAGAACCAAGGGCCACCGAGGGAACCATACAATGAATGGGCACTAG -MK115690.1,vpr,5552,5843,5558,5849,forward,0.37688442211055273,MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS,MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS*,ATGGAACAAGCCCCAGAGAACCAAGGGCCACCGAGGGAACCATACAATGAATGGGCACTAGAGCTTTTAGAGGAGCTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACACATCTATGAGACTTATGGGGATACTTGGACAGGAGTGGAAGCCTTAATAAGAAGTCTGCAACAACTGCTGTTCATTCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGAATTACTCCACAGAGGAGAACAAGAAATGGAGCCAGTAGATCCTAA -MK115690.1,tat_exon1,5823,6042,5829,6045,forward,0.40192926045016075,MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ,MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ*,ATGGAGCCAGTAGATCCTAATCTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCACTTGCTATTGTAAACAGTGTTGCTATCATTGCCAAGTTTGTTTCATAACCAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAGTAA -MK115690.1,rev_exon1,5962,6043,5968,6046,forward,0.524971623155505,MAGRSGDNDEDLLKTVRFIKLLYQSSK,MAGRSGDNDEDLLKTVRFIKLLYQSSK,ATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAGTAAG -MK115690.1,vpu,6054,6300,6060,6309,forward,0.48542752364408415,MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL,MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL*,ATGCAATCTTTAGCAATATTAGCAATAGTAGCATTAGTAGTAGCAGCCATAATAGCAATAGTTGTGTGGACCATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGATAGTGGCAATGAGAGTGAAGGGGATCATGAAGAATTATCAGCACTTATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAG -MK115690.1,env,6217,8800,6223,8794,forward,0.49751604598034604,MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ,MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ*,ATGAGAGTGAAGGGGATCATGAAGAATTATCAGCACTTATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTTACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAAACACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCTACAGACCCCAACCCACAAGAAATAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTACATTGCACTAAGTTGGAGATTAATAGCACTAAGAAGACTAATAGCACTAATAATGGTACTAACATCAATGCCACTGATGATAGTTGGGGGGAAATGAAAAACTGCTCTTTCAATACCACTGCAAGCATAAGAGATAAGGTACAGAGAGAATTTGCGCTTTTTTATAAACTTGATATAGTACCAATAGATAATGATGATATCAACTATAGGTTAATAAGTTGTAACACCTCAGTCCTTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAGAGATAAAAATTTCAATGGAACAGGACAATGTAAAAATGTCAGCACAGTGCAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTCAATGGCAGTCTAGCAGAAGAAGAGGTAGTAATTAAATCTGAAAATATCACAGACAATACTAAAACTATAATAGTACAGCTGAATGCATCTGTAGCAATTGTTTGTACAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGGCCAGGGAGAGCGTTTTATGCAGCAGGAGATATAATAGGAGACATAAGACGAGCACACTGTATCCTTAACAAAACAACATGGGATAACACAATAGAACAGGTAGCTAAAAAATTAAGAGAACAATTTGAGAATAAGACAATAGTCTTTAGTGAATCCTCGGGAGGGGACCCAGAAATTACAATGATTAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAGTACAACTGTTTAATAGTACTTGGCATAATAATGGGAGTAGTACTACAGGGTCAAGTAGCAGTGAAGGCAATATCACACTCCCATGCAAAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACCAATTAGCTGCGAGTCAAATATTACAGGGTTGCTACTAACAAGAGATGGTGGGAATGACGCTAACGGGAACAACACCGAGACCTTCAGACCTGGAGGAGGAAATATGAGGGACAATTGGCGAAGTGAATTATATAGATACAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAGGGCACAGAGAAGAGTGGTACAGAGAGAAAAAAGAGCAGTGGGTCTCGGAGCCTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGCTTTGGGGTTGCTCTGGAAAACTCATCTGCAACACTGCTGTGCCTTGGAATACTAGTTGGAGTAACAAATCTCTGGATGATATTTGGCATAACATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAAACATAATATACAGCTTAATTGAGGCATCGCAAACCCAGCAAGAAAAGAATGAACAAGAATTACTAGAATTAGACAAATGGGCAAGTCTGTGGAATTGGTTTAGCATATCAAACTGGCTGTGGTACATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTACTATACTTTCTATAGTGAATAGAGTTAGGAAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAGTGGATGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAACCTGTGCCTCTTCCTCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATACTGGTGGAACCTTCTGCAGTATTGGAGGCGGGAACTAAAGAATAGTGCTGTTAGCTTGCTTAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGAGTTATAGAAGGATTGCGCAGAGCTTTTAGAGCTATTATCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGAGCTTTGCAATAA -MK115690.1,tat_exon2,8381,8474,8375,8471,forward,0.4918032786885247,RPTSQPRGDPTGPKEPETKVESKTETDPLT,RPTSQPRGDPTGPKEPETKVESKTETDPLT*,AGACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAG -MK115690.1,rev_exon2,8382,8658,8376,8652,forward,0.42982806877249113,DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE,DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE*,GACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAGTGGATGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAACCTGTGCCTCTTCCTCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATACTGGTGGAACCTTCTGCAGTATTGGAGGCGGGAACTAAAGAATAG -MK115690.1,nef,8801,9425,8795,9416,forward,0.459649710885779,MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN,MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN*NC*,ATGGGTGGTAAATGGTCAAAATGTAGTATAGTTGGATGGCCTACTGTAAGGGAAAGAATAAGACGAGCAGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAAGCATGGAGCAATCACAAGTAGCAATGCTAACAATGCTGATTGTACCTGGCTGGAAGCCCAAAAAGAAGAGGAGGAGGTAGGCTTTCCAGTCAGGCCTCAGGTACCCTTAAGACCAATGACTTACAAGGCAGCCTTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGATAATTTACTCCCAAAAAAGACAAGATATTCTTGATCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACTAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGAGAGGGTAGAAGAGGAGAATAAAAGAGAGAACCGCTGCTTGTTACACCCTATGAGCCAGCATGGGATGGATGACCCAGAGAAAGAAGTGCTACAGTGGAGGTTTGACAGCCGCCTAGCCTTTCACCACGTAGCCAGAGAGCTGCATCCGGAGTACTATAAGAACTAGAACTGCTGA -MK115571.1,gag,579,2079,789,2292,forward,0.3014827756125966,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115571.1,pol,1871,4883,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAAATAGGGGGGCAATTTAAAGAAGCTTTCTTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTAAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115571.1,vif,4827,5406,5040,5619,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115571.1,vpr,5345,5636,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115571.1,tat_exon1,5616,5835,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115571.1,rev_exon1,5755,5836,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115571.1,vpu,5847,6093,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115571.1,env,6010,8551,6223,8794,forward,0.4585964351370794,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAGATAAGATGCAGAAAGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAAATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGGATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTTAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115571.1,tat_exon2,8132,8228,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115571.1,rev_exon2,8133,8409,8376,8652,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115571.1,nef,8552,9167,8795,9416,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAATGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGATACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTGCACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK115514.1,gag,584,2084,789,2292,forward,0.3014827756125966,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115514.1,pol,1876,4888,2084,5096,forward,0.19298018391400085,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGCTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAATACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115514.1,vif,4832,5411,5040,5619,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGAGATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115514.1,vpr,5350,5641,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115514.1,tat_exon1,5621,5840,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115514.1,rev_exon1,5760,5841,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115514.1,vpu,5852,6098,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115514.1,env,6015,8556,6223,8794,forward,0.46021436825118545,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATATTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAGTCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTAAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115514.1,tat_exon2,8137,8233,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115514.1,rev_exon2,8138,8414,8376,8652,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115514.1,nef,8557,9172,8795,9416,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACGGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK115488.1,gag,707,2207,789,2292,forward,0.3014827756125966,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115488.1,pol,1999,5011,2084,5096,forward,0.19298018391400085,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGCTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAATACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115488.1,vif,4955,5534,5040,5619,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGAGATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115488.1,vpr,5473,5764,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115488.1,tat_exon1,5744,5963,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115488.1,rev_exon1,5883,5964,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115488.1,vpu,5975,6221,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115488.1,env,6138,8679,6223,8794,forward,0.46021436825118545,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATATTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAGTCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTAAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115488.1,tat_exon2,8260,8356,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115488.1,rev_exon2,8261,8537,8376,8652,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115488.1,nef,8680,9295,8795,9416,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACGGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK115030.1,gag,176,1685,789,2292,forward,0.27304152847199525,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATGGGAAAAAATTTACCTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGTGTACATCAAAGGATAAATGTAAAAGACACCAAGGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATGGTACATCAACCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAGGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAGGGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATACTCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGGGATTATGTAGACCGGTTCTATAAAACTCTAAGGGCTGAGCAAGCGTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAATCAGCCTCCATAATGGTGCAGGGAGGCAATTTTAGGAACCAAAGAAAGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA -MK115030.1,pol,1477,4489,2084,5096,forward,0.26443159013103534,FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCAGTCAACATAATTGGAAGAAATCTGTTGACCCAGCTTGGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATGGAAAAGGAAGGGAAAATTACAAAAATTGGGCCTGAGAATCCATATAATACTCCAGTGTTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTGGGAAGTTCAACTAGGAATACCACATCCCGCAGGGTTAAAAAGGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGGAGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGGGGTGGGGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAGTTGAATTGGGCAAGCCAGATCTATCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGGGGAGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCTATACAAAAGGAAACATGGGAAATGTGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAATTAGGAAAAGCAGGGTATGTTACGGACAGAGGAAGACAAAAGGTTGTCTCCCTAATGGACACAACAAATCAGAGGACTGAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAGGGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAGGAAAAGATTTACCTGGCATGGGTCCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTAATGGAATCAGAAAAATACTATTTCTGGATGGAATAGATAAGGCCCAAGAAGAACATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115030.1,vif,4433,5012,5040,5619,forward,0.3903081914030819,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGGGGAAGCAAGATTGGTAATAAAAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAG -MK115030.1,vpr,4951,5242,5558,5849,forward,0.3566796368352788,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGACATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115030.1,tat_exon1,5222,5441,5829,6045,forward,0.48954161103693805,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA -MK115030.1,rev_exon1,5361,5442,5968,6046,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG -MK115030.1,vpu,5453,5699,6060,6309,forward,0.5682727709300466,MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM,MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM*,ATGCATATCTTAGAAATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGGGACCAGGAGGAATTATCAGCAATTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG -MK115030.1,env,5616,8217,6223,8794,forward,0.5091484869809996,MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGAAAGTGACGGGGACCAGGAGGAATTATCAGCAATTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAGAAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAAATCGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAGGTAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATGGAACAGACATAATAGGGGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAATAATACTTGGAATGGTACTGATAATTGGAATGGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGAAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAATGGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAACCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAAGCAGTGGGAAAAGGAAATTGACAATTACACAGACATAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTAAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -MK115030.1,tat_exon2,7798,7891,8375,8471,forward,0.4918032786885247,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG -MK115030.1,rev_exon2,7799,8075,8376,8652,forward,0.40871934604904625,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG -MK115030.1,nef,8218,8860,8795,9416,forward,0.5432971135257649,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTGCCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATACTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA -MK115498.1,gag,663,2163,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115498.1,pol,1955,4967,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115498.1,vif,4911,5490,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115498.1,vpr,5429,5720,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115498.1,tat_exon1,5700,5919,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115498.1,rev_exon1,5839,5920,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115498.1,vpu,5931,6177,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115498.1,env,6094,8635,6223,8794,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115498.1,tat_exon2,8216,8312,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115498.1,rev_exon2,8217,8493,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115498.1,nef,8636,9251,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK115211.1,gag,250,1753,789,2292,forward,0.25132972351334526,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP*SQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGACAAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAGATATAAGTTAAAACATATAGTATGGGCAAGCAGGGAACTGGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAGGAACTTAAATCATTATTTAATACAGTAGCAGTCCTCTATTGTGTGCATCAAAAGATAGAGATAAAAGACACCAAGGAAGCTTTAGACAAGATAGAGGAAGAACAAAACAAAAGTAAGAAAAAGACACAGCAAGCAGCAGCTGACACAGGACATAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATGCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTGAAAGTAGTAGAAGAGAAGGCATTTAGCCCAGAAGTAATACCCATGTTTTCAGCCTTATCAGAAGGAGCCACCCCACAAGATTTGAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACTATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCGATTGCACCAGGCCAGATGAGAGAGCCGAGGGGAAGTGACATAGCAGGAACCACCAGTACCCTTCAGGAGCAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTACAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAACCCAGATTGTAAAACCATTTTAAAAGCATTGGGTCCAGCAGCTACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAACTCAAATGCCGTGATGATGCAGAAAGGCAATTTTAGGAGCCAAAGAAAGATGGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCAAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAACTTTCCTCAAAGCAGGACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAA -MK115211.1,pol,1545,4557,2084,5096,forward,0.2540106951871657,FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAACTTTCCTCAAAGCAGGACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTGTTAGAAGACATGAATTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAAACAGTATGATCAGATATCAGTAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAATATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAGGAAATGGAAAAGGAAGGGAAAATTTCAAGAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCAATAAAGAAAAAAGACAGTACTAAATGGAGAAAGTTAGTAGATTTTAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCCTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTACTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCTGACATAGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAGTAGAGGAACTGAGACAACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAACTGCCAGAGAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAGTTGAATTGGGCAAGTCAGATTTATCCAGGGATTAAAGTAAGGCAGTTATGTAAACTACTTAGAGGAGCCAAGGCGCTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATCCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAACTTGAAAACAGGAAAATATGCAAGAACAAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATTCAAAAAGAAACATGGGAATCATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACAAAATCAGGAAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAAGTTATTTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGATAAAAGCGAATCAGAGTTAGTCAATCAAATAATAGAGCAATTAATACAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGGGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGAAAGGTACTATTTTTGGATGGAATAGATAAAGCCCAAGAAGATCATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACCTACCACCTGTAATAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCTAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCCCCAACTTCACCAGTAATGCAGTTAAGGCCGCCTGTTGGTGGGCAGGGGTCAAACAAGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTTGTAGAATCTATGAATAAACAATTAAAACAAATTATAGGGCAGGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAGGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTGGTAATACAAGATAATAGTGACATAAAAGTAGTACCAAGAAGAAAAGTAAAAATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAA -MK115211.1,vif,4501,5083,5040,5619,forward,0.40472673559822736,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAACATGTGGAAAAGCTTAGTAAAATACCATATACATAATTCAGGGAAGGCTAGGGGATGGTGTTATAGACATCACTATGAAAGCAGACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGAGGAGAGGCTAGACTAGTAGTGACAACATATTGGGGCCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTATTTTAATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAATAAGGTAGGATCTCTGCAGTACTTGGCACTAATAGCATTAATACCACCAAAAAGGAGAAAGCCACCTTTGCCTAGTGTGAGGAAACTGACAGAGGATAGATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG -MK115211.1,vpr,5022,5313,5558,5849,forward,0.3808935556928146,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*,ATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCATGGCTTCACGGCCTAGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAACTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGGGCAAGAAATGGAGCCAGTAGATCCTAG -MK115211.1,tat_exon1,5293,5512,5829,6045,forward,0.4691531785127845,MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAAGACTGCTTGCACCAGTTGCTATTGTAAAAGGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGA -MK115211.1,rev_exon1,5432,5513,5968,6046,forward,0.564475664826894,MAGRSGDSDEELLRITRTIKFLYQNSE,MAGRSGDSDEELLRITRTIKFLYQNSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGAG -MK115211.1,vpu,5524,5794,6060,6309,forward,0.5776066350710902,MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL,MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL*,ATGCAATCTTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTCGTTTGGTCTATAGTATTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAA -MK115211.1,env,5687,8198,6223,8794,forward,0.6638103647692366,MHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGRSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDPEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTTINNTSSIEEGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSATITQACPKVSFEPIPIH*VQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRKAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAATGCAGAAGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACCCAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTGACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTGAGTTGAAGAATAGCACTACTATAAACAATACCAGTAGTATAGAAGAAGGAGAAATGAAAAACTGTTCTTTTAATGCCACCACAGCAATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAGACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGATATAGGTTGATAAATTGTAACTCCGCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTAGGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAAAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGAAAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGAGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAATACAGAAGTAAATATTATCACACTCCCATGCAAGATAAAGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACACTTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTACATTTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGTAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGACTTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA -MK115211.1,tat_exon2,7779,7872,8375,8471,forward,0.4464285714285715,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAG -MK115211.1,rev_exon2,7780,8056,8376,8652,forward,0.4267425320056898,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG -MK115211.1,nef,8199,8823,8795,9416,forward,0.5093153589821267,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACACCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTGCCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACCCAGATAAAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA -MK115158.1,gag,316,1819,234,1731,forward,0.38499312512276596,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP*SQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGACAAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAACAATATAAGTTAAAACATATAGTATGGGCAAGCAGGGAACTGGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAGGAACTTAAATCATTATTTAATACAGTAGCAGTCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGACAAGATAGAGGAAGAACAAAACAAAAGTAAGAAAAAGACACAGCAAGCAGCAGCTGACCCAGGAAATAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATGCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTGAAAGTAGTAGAAGAGAAGGCTTTTAGCCCAGAAGTAATACCCATGTTTTCAGCCTTATCAGAAGGAGCCACCCCACAAGATTTGAACACGATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACTATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCGATTGCACCAGGCCAGATGAGAGAACCGAGGGGAAGTGACATAGCAGGAACCACCAGTACCCTTCAGGAGCAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTACAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAACCCAGATTGTAAGACCATTTTAAAAGCATTAGGTCCAGCAGCTACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAACTCAGCTTCCGTGATGATGCAGAAAGGCAATTTTAGGAGCCAAAGAAAGATGGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCAAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTATGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAA -MK115158.1,pol,1611,4623,1526,4535,forward,0.30843043180260443,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTATGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTGTTAGAAGAAATGAGTCTACCAGGAAGATGGAAGCCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAAACAGTATGATCAGATATCAGTAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAATATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAGGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCAATAAAGAAAAAAGACAGTACTAAATGGAGAAAGTTAGTAGATTTTAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCCTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTACTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAGAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATGGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAGTAGAGGAACTGAGACAACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAACTGCCAGAGAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAGTTGAATTGGGCAAGTCAGATTTATCCAGGGATTAAAGTAAGGCAGTTATGTAAACTACTTAGAGGAGCCAAGGCGCTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATCCTAAAAGAACCAGTGCATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAACTTGAAAACAGGAAAATATGCAAGAACAAGGGGTGCTCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATTCAAAAAGAAACATGGGAATCATGGTGGACAGAATATTGGCAAGCCACTTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACAAAATCAGGAAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAAGTTATCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGATAAAAGCGAATCAGAGTTAGTCAATCAAATAATAGAGCAATTAATACAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGGGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGAAAGGTACTATTTTTGGATGGAATAGATAAGGCCCAAGAAGATCATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACATACCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCTAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCCCCAACTTCACCAGTAATGCAGTTAAGGCCGCCTGTTGGTGGGCAGGGGTCAAACAAGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTTGTAGAATCTATGAATAAACAATTAAAACAAATTATAGGACAGGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAACTTCTTTGGAAAGGTGAGGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTACCAAGAAGAAAAGCAAAAATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAA -MK115158.1,vif,4567,5149,4479,5061,forward,0.48399487836107546,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAACATGTGGAAAAGTTTAGTAAAATACCATATACATAATTCAGGGAAGGCTAGGGGATGGTGTTATAGACATCACTATGAAAGCAGACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGAGGAGAGGCTAGACTAGTAGTGACAACATATTGGGGCCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTATTTTAATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAATAAGGTAGGATCTCTGCAGTACTTGGCACTAATAGCATTAATACCACCAAAAAGGAGAAAGCCACCTTTGCCTAGTGTGAGGAAACGGACAGAGGATAGATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG -MK115158.1,vpr,5088,5379,5000,5291,forward,0.43053960964408733,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*,ATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCATGGCTTCACGGCCTGGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAATTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115158.1,tat_exon1,5359,5578,5271,5487,forward,0.4464285714285715,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAGGACTGCGTGCACCAGTTGCTATTGTAAAAAGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAAGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGA -MK115158.1,rev_exon1,5498,5579,5410,5488,forward,0.5622384937238494,MAGRSGDSDEELLKITRTIKFLYQNSE,MAGRSGDSDEELLKITRTIKFLYQNSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAAGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGAG -MK115158.1,vpu,5590,5860,5502,5748,forward,0.5374618963580942,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWDVNDL,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWDVNDL*,ATGCAATCCTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTTGTTTGGTCTATAGTACTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAA -MK115158.1,env,5753,8315,5665,8212,forward,0.5078662118966413,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGMSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCENVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGMSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCENVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAATGCAGAAGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACACAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTGACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTGAGTTGAAGAATAGCACTGGAGAAATGAAAAACTGTTCTTTTAATGCCACCACAGCAATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAGACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGATATAGGTTGATAAATTGTAACTCCTCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAATTTCAATGGAACAGGACTATGTGAAAATGTTAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAAAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGGGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAATACAGAAGTAAATATTATCACACTCCCATGCAAGATAAAGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTATATCTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGAAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGACTTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGAGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA -MK115158.1,tat_exon2,7896,8004,7793,7901,forward,0.5826923076923078,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*RMDS*,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAA -MK115158.1,rev_exon2,7897,8173,7794,8070,forward,0.45968205324650446,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGSGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGSGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGAGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG -MK115158.1,nef,8316,8940,8213,8834,forward,0.5254870367657829,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACACCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTGCCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACTCAGAGAGAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA -MK114705.1,gag,532,2047,789,2292,forward,0.27270615563298484,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGCGAATTAGATAGATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAGTTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCGGTTAATCCTGGCCTGTTAGAAACATCAGAGGGCTGTAGGCAAATACTGGGACAGCTACAACCGTCCCTTCAAACAGGATCAGAAGAACTTAAATCATTATTTAATACAATAGCAGTCCTTTATTGCGTACATCAAAGGATAGATGTAAAAGACACCAAGGAAGCTCTAAATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAGCAGTCAGAGCAGTCAAGTCAGCCAAAATTACCCTATAGTGCAGAACCATCAGGGGCAAATGGTATATCAGGCTCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCCGAGGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAGGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTACATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGGACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGAAATTTATAAAAGATGGATAATCATGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTATCAGCATTCTGGACATAAGACAAGGACCAAAAGAACCTTTTAGAGATTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAAGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACCATTCTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCAGCCACAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGCAACAGGTGGTGCAACTAACATAATGATGCAGAAAGGCAATTTTAGGAACCAAGGAAAACCTATTAAGTGTTTCAATTGTGGCAAAGAAGGGCACCTAGCTAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGACTGCTCTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTCCAGAACAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAGCTCCCCCTCAGAAGCAGGAGCCGACAGACAAGGAACTGTATCCCTTCTCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAGTAA -MK114705.1,pol,1839,4851,2084,5096,forward,0.21944123990570308,FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTCCAGAACAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAGCTCCCCCTCAGAAGCAGGAGCCGACAGACAAGGAACTGTATCCCTTCTCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAGTAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAAATACCCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTAAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAACCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCCGTATTTGCCATAAAGAAAAAGGATAGTACTAAATGGAGAAAGTTAGTAGATTTCAGAGAGCTTAATAAAAGAACTCAAGACTTTTGGGAGGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTCTCAGTTCCTTTAGATGAAAGCTTCAGAAAGTATACTGCATTTACCATACCTAGTACTAACAATGAGACACCCGGGATTAGGTATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTTCAAAGTAGCATGACGAAAATCTTAGAACCTTTTAGAAAACAAAATCCAGACATAGTTATCTACCAATACATGGATGATTTATACGTAGGATCTGACTTAGAAATAGAGCAGCATAGAGCAAAAGTAGAGAACCTGAGAGAGCATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAGCATCAGAAAGAACCTCCATTTCTTTGGATGGGCTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAGCTAAGGCACTAACAGAAGTGATAACACTAACAGAAGAAGCAGAGCTAGAATTGGCAGAAAACAGAGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAGTAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACCTATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAACAAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAAGCAGTTCAAAAAATAGCCACAGAGAGCATAGTAGTATGGGGAAAGATTCCTAAATTTAGATTACCCATACAGAAAGAAACATGGGAAACATGGTGGATGGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAGTACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAAAAAGGAAAAGCAGGATATGTTACTGACAGAGGAAGGCAAAAAGTTATCCCCTTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGACAAGAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAGAAGGTCTACCTGACATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCAGGAATCAGGAAAATACTATTTTTGGATGGAATAGATAAGGCCCAGGAAGATCATGAGAAATATCATAGTAATTGGAAAGCAATGGCTAGTGATTTTAACATACCACCTGTGGTAGCAAAAGAGATAATAGCCAGCTGTGATAAATGTCAGCTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTCCATGTAGCCAGTGGGTACATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAAAATAATACATACAGATAATGGTAGCAATTTCACCAGCACTACAGTCAAGGCCGCCTGCTGGTGGGCAGGTGTTAAGCAGGAGTTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTGGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGAGTACTGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAGGGACCAGCAAAGCTGCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGAAATCAAAGTAGTACCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK114705.1,vif,4795,5374,5040,5619,forward,0.3566796368352788,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTCTAGTAAAACACCATATGTATATTTCAAAGAAAGCTAAGGGATGGGTTTACAGACACCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGGAAAAAGAGATATAACACACAAGTAGACCCTGGCCTAGCAGACCAACTAATTCATATGTACTATTTTGATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTGCAATACCTGGCACTAGCAGTATTAGTAGCACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTCGCGAGACTGACAGAGGATAGATGGAACAAGCCCCGGAAGATCAAGGGCCACAGAGAGAGCCATACAATGAATGGGCACTAG -MK114705.1,vpr,5313,5598,5558,5849,forward,0.39401343921808174,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS*,ATGGAACAAGCCCCGGAAGATCAAGGGCCACAGAGAGAGCCATACAATGAATGGGCACTAGAACTTTTAGAGGAGCTTAAGAGGGAAGCTGTTAGACATTTTCCTAGGGAATGGCTCCATAGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGGCAGGAGTAGGAGCCATAATAAGAATACTGCAACAATTACTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGGATAGGCATACTGAGGAGAACAAGAAATGGAGCCCGTAGATCCTAG -MK114705.1,tat_exon1,5578,5797,5829,6045,forward,0.5138258357408172,MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ,MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ*,ATGGAGCCCGTAGATCCTAGACTGGAACCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTAACAATTGCTATTGTAAAAAGTGCTGCTTTCATTGCCAAGTTTGCTTCACAAAAAAGGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGCGACAGAGACGAGGACCTCCTCGAGACAGTCAGATTCATCAAGTTCCTCTACCAAAACAGTAA -MK114705.1,rev_exon1,5717,5798,5968,6046,forward,0.5940834141610087,MAGRSGDRDEDLLETVRFIKFLYQNSK,MAGRSGDRDEDLLETVRFIKFLYQNSK,ATGGCAGGAAGAAGCGGCGACAGAGACGAGGACCTCCTCGAGACAGTCAGATTCATCAAGTTCCTCTACCAAAACAGTAAG -MK114705.1,vpu,5809,6055,6060,6309,forward,0.5727186311787074,MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL,MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL*,ATGCAACCTTTAGAGATATCAGCAATAGTAGCATTAGTAGTAGTAGCAATAATAGCAATAGTTGTGTGGACCATAGTACTCTTAGAGTATAGGAAAATATTAAGGCAAAAGAAAATAGACAGATTAATTAATAGAATAAGTGAAAGAGCAGAAGACAGTGGCAATGAGAGTGACGGGGATCAAGAAGAATTGTCAGCTCTTATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAG -MK114705.1,env,5972,8549,6223,8794,forward,0.5021538905210794,MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL,MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL*,ATGAGAGTGACGGGGATCAAGAAGAATTGTCAGCTCTTATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAGTGCTACAAACATGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGATGCAACCACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGATACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCGACCCACAAGAAGTAGTACTGGAAAATGTGACAGAAAATTATAATATGGGAAAAAATAACATGGTGGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTACTCTTAACCCCATTCTGTGTCACTTTAAATTGCACTGATGCTAACATCACCAGCACTAATAATAGTAGAGATAAGAAGGAAGGAGAAAGTACATTGGAGGAGACGAAAGGAGAAATAAAAAACTGCTCTTTCAATATGACTTCAAGCATGAGCGATAAGTCTCAGAAACAACGTGCACTTTTTTATAAGCTTGATGTGGTACAAATAGATGAGACTAATAATAATAGTTATAGGTTGATAAGTTGTAACACCTCAGTCGTCACACAGGCTTGTCCAAAGGTATCCTTTGATCCAATCCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATAATAAGAAATTCAATGGAACAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAACCTGTAGTGTCAACCCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAAGTAATGATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTGCAGCTGAAGACACCTGTACAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGGATAAGTATGGGACCAGGGAGAGTAATTTATGCAACAGGACAAATAATAGGAGATATAAGAAAAGCACATTGCAACATTAGTAGAGCAGAATGGAATACAACTTTAAAGCAGATAGTTACACAATTAAGAAAGCAGTGGAATAGAACCATAATCTTTAACTCATCCTCAGGAGGGGACCCAGAAATTGTGATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACAAAACTATTTAATAGTACTTGGCCACGTAATAGTACTTGGAATAATACTGAAGGGTCAAATGACACTGAAATAATCACACTCCCGTGCAGAATAAAACAAATTGTAAACAGGTGGCAGGAAGTAGGCAAAGCAATGTATGCCCCTCCCATCCAAGGACAAATTAGTTGTTCATCAAATATTACAGGGCTGCTACTAGTTAGAGATGGTGGAATTAACACCAGTGAGAGCAACGAGACCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAGGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATGCTGGGAGCTATGTTCCTTGGGCTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGTTGACGGTACAGACCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAGCAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGACTCCTAGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAACACTAGTTGGAGTAATAGATCTTATGAAGATATTTGGAACAACATGACCTGGATGGAGTGGGAAAAAGAAATTGACAATTACACAGGCTTAATATACACCTTAATTGAAAAATCGCAGAACCAGCAGGAAATAAATGAACAAGAACTATTGTCATTGGATAAGTGGGCAAGCCTGTGGAATTGGTTTAATATAACAAATTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGACTGGATTCTTCGCACTTTTCTGGGACGATCTACGAAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTAATCTTGATTGTAGTGAGGGTTGTGGAAATTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAAATAAAGAATAGTGCTATCAGCTTGCTCAACGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGAATCATAGGAGTAGTACAAAGAACTTGGAGAGCTTTTATCCACATACCTAGGAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA -MK114705.1,tat_exon2,8130,8226,8375,8471,forward,0.6074396517609815,RPPAQPQGDPTGPKKSKKEVEKETETDQCD,RPPAQPQGDPTGPKKSKKEVEKETETDQCD**,AGACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGA -MK114705.1,rev_exon2,8131,8407,8376,8652,forward,0.47688921496698455,DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE,DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE*,GACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGACTGGATTCTTCGCACTTTTCTGGGACGATCTACGAAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTAATCTTGATTGTAGTGAGGGTTGTGGAAATTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAAATAAAGAATAG -MK114705.1,nef,8550,8985,8795,9416,forward,0.6017710152157637,MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK,MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK*,ATGGGTGGAAAATGGTCAAAAAAGAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAAAATGAAGCGAACTGAGCCAGCAGCAGAGGGGGTGGGAGCAGCATCTCGAGACCTGGACAAATATGGAGCAATCACAAGTAGCAATACAGCACAGACCAATCCTGATTGTGCCTGGCTAGAAGCACAAGAAGAGGAAGAGGTAGGCTTTCCAGTCAGACCCCAGGTACCTTTGAGACCAATGACTTACAAGGCAGCTGTGGATATGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAGAGACAAGATATCCTTGATCTGTGGATCTATCACACACAAGGCTACTTCCCTGATTGGCAAAATTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGAGGGTGCTTCAAGTAG -MK114856.1,gag,120,2022,789,2292,forward,0.7511039743075072,MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC,MLHISSCFLPVLGLSGWTRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSGSNLVQPERPSSSGARTGT*KRK*NQRRSLDAGLGLLKRARQEAKGGDW*VRHF*LAEARRRKIGARASVLSRGELDR*EKIQLRPRRKKKYRLKHIV*ASKELERFAVNPGLLETSGGCKQILEQLQPSLQTRSEELRSLYNTVATLYYVHQKIDVKDTKEALDKVEEEQNKSKKKAQQAAADTRNRGQTSQNFPIVQNLQGQIVHQAISPRTLNA*VKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVSRHQAAMQMLKKVINEEAAE*DRLHPVHARPIAPGQIREPKRSDIARTTSTLQEQIR*MTHNPPIPVRKIYKR*IILGLNKIVKMYSPTSILDIKQRPKEPFRDYVDQFYKTLRAKQATQKVKN*MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC*KYRKERHQMKNCTKRQANFLKKIWPSHKGRPENFPQSRPEIPQSRPEPTAPPAPPEKSFKFEEATTPSQKQETIDKELYPLTSLRSLFGNDPSSQ*,ATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTGGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGTTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGGCTCAAATCTGGTCCAACCAGAGAGACCCAGTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGTAGAACCAGAGAAGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAAAGGCGGCGACTGGTGAGTACGCCATTTTTGACTAGCAGAGGCTAGAAGGAGAAAGATAGGTGCGAGAGCGTCAGTATTGAGCAGAGGAGAATTAGATAGATAGGAGAAAATTCAGTTAAGGCCAAGGAGAAAGAAAAAATATAGATTAAAACATATAGTATAGGCAAGCAAGGAACTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGGAGGCTGTAAACAGATATTAGAACAGCTACAACCATCCCTTCAGACAAGATCAGAAGAACTTAGATCATTATATAATACAGTAGCCACCCTCTATTATGTACATCAAAAGATAGATGTAAAAGACACCAAAGAAGCGTTAGACAAAGTAGAAGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCGGCAGCTGACACAAGAAACAGAGGCCAGACCAGTCAAAATTTCCCTATAGTGCAGAACCTACAAGGGCAAATAGTACATCAGGCCATATCACCTAGAACTTTAAATGCATAAGTAAAAGTAGTAGAAGAAAAAGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACTATGCTAAACACAGTAAGTAGACACCAAGCAGCTATGCAAATGTTAAAAAAGGTCATCAATGAAGAAGCTGCAGAATAAGATAGATTACATCCAGTGCATGCAAGGCCTATTGCACCAGGCCAGATAAGAGAACCAAAAAGAAGTGACATAGCAAGAACTACTAGTACCCTTCAGGAACAAATAAGATAGATGACACATAATCCACCTATCCCAGTAAGAAAGATTTATAAAAGATAAATAATTCTAGGACTAAATAAAATAGTAAAAATGTATAGCCCTACCAGCATTTTAGACATAAAGCAAAGGCCAAAAGAACCCTTTAGAGACTATGTAGACCAGTTCTATAAAACTTTAAGAGCCAAGCAAGCTACACAGAAAGTAAAAAATTAGATGACAAAAACCTTGTTAGTCCAGAATGCAAATCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAAAAAGTAAGAAGACCCGGCCATAAAGCAAAAGTTTTAGCTGAAGCAATGAGCCAAGCAACAGGTGCAGCCAACATAATGATGCAGAGAGGCAATTTTAAGAACCAAAGAAAGCCTGTTAAATGTTTCAATTGTGGCAAAGAAAAGCACATAGCCAAAAATTGCAAGGCCCCTAAGAAAAAAGGCTGTTAGAAATATAGAAAAGAAAGACACCAAATGAAAAATTGCACTAAGAGACAGGCTAATTTTTTAAAGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGAGAACTTTCCTCAAAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAAAGAGCTTCAAGTTTGAAGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATAGACAAGGAGCTGTATCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAA -MK114856.1,pol,1787,4826,2084,5096,forward,0.7637180771917039,ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI,FFKENLAFPQRKARELSSKPTRNSSEQTRANSPTSPSRKELQV*RSNNSLSEAGDNRQGAVSSNFPQITLWQRPIVTIKIREQLKKALLNTGADDTVLEDIDLPRK*KPKMIRRIRSFIKVRQYEQVPIEISRHKAISTVLVGPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPRMDGPKVKQ*PLTEEKIKALVEICTEIEKEKKISKIRPENPYNTPVFAIKKKDGTK*KKLVDFRELNKKTQDF*EIQLSIPHPAKLKKKKSVTVLDVGDAYFSVPLDKDFKKYTAFTIPSINNETPKIRYQYNVLPQR*KRSPAIFQSSMTKILEPFRKTNPDIVIYQYIDDLYVRSDLEIRQHRTKVKELRQHLMR*RFTTPDKKHQKEPPFL*MRYELHPDKWTVQPIVLPEKES*TVNDIQKLVRKLN*ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI*RRTPKFRLPIQKET*ET*WTDYWQAT*IPK*EFVNTPPLVKL*YQLEKEPIIRAETFYVDKAANKDNKSRKARYVTDRRRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKKKVYLA*VPAHKRIKRNEQVNKLVSARIKKVLFLDKIEKAQEDHKKYHSN*RTMASNFNLPPIVAKEIVASCDKCQLKKEAMHRQVDCSPGIWQLDCTHLEEKIILVAVHVASRYIEAEVIPAETRQETAYFILKLARRWPVKTIHTDNGRNFTSNTVKAAC**AKIKQEFSIPYNPQSQEVVKSINNELKKIIRQVKDQAKHLKTAVQMAVFIHNFKRKGGIEGYSAEERIVDIIATEIQTKELQKQITKIQNFQVYYKDSRDPL*KGPAKLLWKGEKAVVIQDNSDIKVVPRRKAKIIKDYKKQMASDDCVASRQDED*,TTTTTTAAAGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGAGAACTTTCCTCAAAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAAAGAGCTTCAAGTTTGAAGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATAGACAAGGAGCTGTATCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAAAGATAAGAGAGCAACTAAAGAAAGCTTTATTAAATACAGGAGCAGATGATACAGTATTAGAAGACATAGATTTGCCAAGAAAATAGAAACCAAAAATGATAAGAAGAATTAGAAGTTTTATCAAAGTAAGACAATATGAACAGGTACCCATAGAAATTAGCAGACACAAAGCTATAAGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTAGAAGAAATCTGTTGACTCAGCTTAGTTGCACTCTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAAGAATGGACGGCCCAAAAGTTAAACAATAGCCATTAACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATAGAAAAAGAAAAGAAAATTTCAAAAATTAGGCCTGAAAATCCATACAATACTCCAGTGTTTGCCATAAAGAAAAAAGATGGCACTAAATAGAAAAAATTAGTAGATTTCAGAGAACTTAATAAGAAAACTCAAGATTTCTAAGAAATTCAATTAAGTATACCACATCCTGCAAAGCTAAAAAAGAAAAAATCAGTCACAGTACTAGATGTAGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAAGAAATATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAAAGATTAGATATCAGTATAATGTGCTTCCACAAAGATAGAAAAGATCACCAGCAATATTCCAAAGTAGCATGACAAAGATCCTAGAGCCTTTTAGAAAGACAAATCCAGACATAGTTATCTATCAATACATAGATGATTTGTATGTAAGATCTGACTTAGAAATAAGGCAACATAGAACAAAAGTAAAGGAACTGAGGCAACATCTAATGAGGTAAAGATTTACCACACCAGACAAAAAGCACCAGAAAGAACCCCCATTCCTTTAGATGAGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTACTGCCAGAAAAAGAAAGTTAGACTGTCAATGACATACAGAAGTTAGTAAGAAAATTGAATTAGGCAAGTCAGATTTATGCAAAGATTAAAGTGAAGCAATTATGTAAGCTCCTTAAAAGAACCAAAGCATTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAAAGATTCTAAAAGATCCAGTACATAGAGCATATTATGACCCAGCAAAGGACTTAATAGCAGAACTACAGAAGCAAAGAGAAGGTCAGTGGACATATCAAATTTATCAAAAGCCATTTAAAAATCTAAAAACAGAGAAATATGCAAGAACGAAAGGTGCCCATACTAATGATGTAAAGCAATTAACAGAAGCAGTGCAAAAAATATCCACAGAAAGTATAGTAATATAAAGAAGGACTCCTAAATTTAGATTACCCATACAAAAAGAAACATAAGAAACATAGTGGACAGATTATTGGCAAGCCACCTAGATCCCTAAGTAAGAGTTTGTCAACACCCCTCCCTTAGTGAAATTATAGTACCAGTTAGAAAAAGAACCCATAATAAGAGCAGAAACCTTCTATGTAGATAAGGCAGCTAATAAAGATAATAAATCAAGAAAAGCAAGATATGTTACTGACAGAAGAAGACAAAAAGTTGTCACCATAAATGACACAACAAATCAGAAAACTGAATTACAAGCCATTCATCTAGCCTTGCAAGATTCAGGGCTAGAAGTAAACATAGTAACAGACTCACAGTATGCATTAAAGATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTAATAAAAAAGAAAAAAGTCTACCTGGCATAAGTGCCAGCCCACAAAAGAATTAAAAGAAATGAACAGGTAAATAAACTAGTCAGTGCTAGAATCAAGAAAGTACTATTTTTAGATAAAATAGAAAAAGCCCAAGAAGACCATAAAAAATATCACAGTAATTAAAGAACAATGGCTAGTAATTTTAACCTACCACCTATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAAAAGAAGCTATGCATAGGCAAGTAGACTGTAGTCCAGGTATATGGCAGCTAGATTGTACACATTTAGAAGAAAAAATTATCCTAGTAGCAGTTCATGTAGCCAGTAGATATATAGAAGCAGAAGTGATTCCAGCAGAGACAAGGCAAGAAACAGCATACTTTATTTTAAAACTAGCAAGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCCGCAATTTCACCAGTAATACAGTGAAGGCCGCCTGTTAGTAGGCAAAAATCAAGCAAGAATTTAGTATTCCCTACAATCCCCAAAGTCAAGAAGTAGTAAAATCTATAAATAATGAATTAAAGAAAATTATAAGACAAGTAAAAGATCAGGCTAAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGAAGGATACAGTGCAGAGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCAGGTTTATTACAAGGACAGCAGAGATCCACTTTAGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAAAGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAAGGATTATAAAAAACAGATGGCAAGTGATGATTGTGTGGCAAGTAGACAGGATGAAGATTAG -MK114856.1,vif,4425,5349,5040,5619,forward,0.7566838361540349,MIVWQVDRMKIRTWKSLVKYHMYISKKAKK,MN*RKL*DK*KIRLNILRQQYKWQYSSTILKEKGGLKDTVQRKE**T**QQKYRLKNYKNKLQKFKIFRFITRTAEIHFRKDQQSFSGKVKRQ**YKITVT*K*CQEEKQKSLRIIKNRWQVMIVWQVDRMKIRTWKSLVKYHMYISKKAKK*AYRHHYETTHPRISSEVHIPLGGARLVITTY*GLHTGEKDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVRSLQYLALTALITPKKIKPPLPSVKKLTEDR*NKPQKTKGHRKSHTMNRH*,ATGAATTAAAGAAAATTATAAGACAAGTAAAAGATCAGGCTAAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGAAGGATACAGTGCAGAGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCAGGTTTATTACAAGGACAGCAGAGATCCACTTTAGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAAAGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAAGGATTATAAAAAACAGATGGCAAGTGATGATTGTGTGGCAAGTAGACAGGATGAAGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAGAAATAGGCTTATAGACACCATTACGAAACCACTCATCCAAGAATAAGTTCAGAAGTACATATCCCACTAGGAGGTGCTAGATTAGTAATAACAACATATTAAGGTCTGCATACAGGAGAAAAAGACTGGCATTTAGGCCAGGGAGTCTCCATAGAATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAAGTAAGATCTCTACAATACTTGGCACTAACAGCATTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAAGATAGATAGAACAAGCCCCAGAAGACCAAAGGCCACAGAAAGAGCCATACAATGAATAGACACTAG -MK114856.1,vpr,5033,5579,5558,5849,forward,0.7334692430420138,MLFIHFRIKCHHSRIGIVLQRRARNRASRS,MEKKEI*HTSRP*LSRPSNSCALF*LFFRICYKKCHIRT*S*P*V*ISSRT*QSKISTILGTNSINNTKEDKATFA*CKETDRR*IEQAPEDQRPQKEPYNE*TLELLEELKREAVRHFPRPWLQNLRQYIYETYKDTWTRVEAIIRILQQMLFIHFRIKCHHSRIGIVLQRRARNRASRS*,ATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAAGTAAGATCTCTACAATACTTGGCACTAACAGCATTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAAGATAGATAGAACAAGCCCCAGAAGACCAAAGGCCACAGAAAGAGCCATACAATGAATAGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAAACCTAAGACAATATATCTATGAAACTTATAAAGATACTTGGACAAGAGTAGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAG -MK114856.1,tat_exon1,5486,5780,5829,6045,forward,0.7619181418001311,MLFIHFRIKCHHSRIGIVLQRRARNRASRS,MLFIHFRIKCHHSRIGIVLQRRARNRASRS*TRALEASRKSA*DSLYQLLL*KVLLSLPSVFYTKSLRHLLWQEEAETETKISSRQSDSSSSSTKAVN,ATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACTAGAGCCCTAGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAAT -MK114856.1,rev_exon1,5698,5779,5968,6046,forward,0.524971623155505,MAGRSGDRDEDLLKTVRLIKFLYQSSK,MAGRSGDRDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAA -MK114856.1,vpu,5790,6039,6060,6309,forward,0.7407973896196594,MQPLKILAIVALVVAAIIAIVV,MQPLKILAIVALVVAAIIAIVV*TIVGIKYKKILRQRKIDRIINRIRKRAEDSGNESEKDQEELSALVVEIRHDAP*DVDDL*,ATGCAACCTTTAAAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGACCATAGTAGGCATAAAATATAAGAAAATATTAAGACAAAGAAAAATAGATAGAATAATTAATAGAATAAGAAAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAAAAGATCAGGAAGAATTGTCAGCACTTGTAGTAGAAATAAGGCACGATGCTCCTTAAGATGTTGATGATCTGTAG -MK114856.1,env,5953,8521,6223,8794,forward,0.7529994904340572,MTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD,MRAKKIRKNCQHL**K*GTMLLKMLMICSAAENL*VTVYYEVPV*RDANTTLFCASDAKAYDTEVHNV*ATHACVPTDPNPHEVELKNVTENFNM*KNNMVDQMHEDIINL*DQSLKPCAKLTPLCVTLNCTDLKNNTVGNQTNYHLNETNTIQRKEMTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD*SDTLSKIVEKLKEKFRKNKTIIFKQSSREDIEIETHSFNCREEFFYCNTTRLFNST*SVNRTSINRTNNKNITLPCRIKQIINRWQEVRKAMYAPPISKIIRCSSNITGLILTRDSSTTNSKEETFRPRERNMKDN*RSELYKYKVVKIEPLKVAPTKAQRKVVQREKRAIRTLGAMFLRFLRTAGSTIGAASLTLTVQARQLLSGIVQQQNNLLKAIEAQQHMLQLTV*GIKQLQARVLSVERYLQDQQLLKI*SCSRKLICTTTVP*NTS*SNKSYSTI*DNMT*MQ*DREIQNYTKIIYNLLKESQIQQKKNEKELLELDQ*ANL*N*FSITKWL*YIKIFIMIVGGLVSLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRRPDRPERIEEEGEKRDRGRSRRLVTRFLPLI*DDLQSLCLFSYHHLKDLLLIVLKTVQILGHKK*EILKY**SLLQY*IQELKNSAVSLLNTIAIAVAERTDKVIEVRQKISRAFLHIPRKIRQGLEKALQ*,ATGAGAGCGAAAAAGATCAGGAAGAATTGTCAGCACTTGTAGTAGAAATAAGGCACGATGCTCCTTAAGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTAAGTCACAGTCTATTATGAGGTACCTGTGTAAAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTAGAAAAATAACATGGTAGACCAGATGCATGAGGATATAATCAATTTATGAGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAAAAATAATACTGTAGGAAATCAAACAAATTATCATCTCAATGAAACTAATACAATACAAAGAAAAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAATATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAAAGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTAGTTTTGCAATTCTAAAGTGTAAAGATGAGATGTTCAATAGAACAAGACCATGTAAGAATGTCAGCACAGTACAATGTACACATAGAATTAGACCAGTAGTGTCAACTCAACTGCTGTTAAATAGTAGCCTAGCAGAAAAAAAGATAGTACTTAGATCTGAAAATTTCACAGACAATACTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAAAGAGAGCAATTTATGCAACAAGACAGATAATAGAAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGAAGTGACACTTTAAGCAAAATAGTTGAAAAATTAAAGGAAAAATTTAGAAAAAATAAAACAATAATCTTTAAGCAATCATCAAGAGAGGACATAGAAATTGAAACGCACAGTTTTAATTGTAGAGAGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGAAGTGTTAATAGAACTAGCATAAACAGAACTAACAATAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATCAACAGGTGGCAGGAAGTAAGAAAAGCAATGTATGCCCCTCCTATCAGTAAGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATAGTAGTACAACTAATAGTAAAGAAGAGACCTTCAGACCTAGAGAAAGAAATATGAAGGACAATTAGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAAAAGTAGCACCCACCAAGGCACAAAGAAAAGTAGTGCAGAGAGAAAAAAGAGCAATAAGAACGTTAGGAGCTATGTTCCTCAGGTTCTTAAGAACAGCAGGAAGCACTATAGGCGCAGCGTCACTGACGCTGACAGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAAGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTAAGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTAGAAAGATACCTACAAGATCAACAGCTCCTGAAGATTTGAAGTTGCTCTAGAAAACTCATTTGCACCACTACTGTGCCTTAGAATACTAGTTAGAGCAATAAATCTTACAGTACCATCTAAGATAACATGACCTAGATGCAGTAGGACAGAGAAATTCAAAATTACACAAAGATAATATACAACTTACTTAAAGAATCGCAAATCCAACAGAAAAAGAATGAAAAAGAATTATTAGAACTAGATCAATGAGCAAATTTGTAGAATTAGTTTAGTATAACAAAATGGCTATAGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAAGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAAAGAACAGATAAAGTTATAGAAGTAAGACAAAAAATTAGCAGAGCTTTTCTCCACATACCTAGAAAGATAAGACAAGGCTTAGAAAAGGCTTTGCAATAA -MK114856.1,nef,7916,9176,8795,9416,forward,0.7587548638132295,MSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MKKNY*N*INEQICRISLV*QNGYSI*KYS****EA**V*K*FLLYFL**IELGKDTHHYHCRPSSQPQEDQTGPKE*KKKVKRETEADPED**LDSYHSSKTTCKACAFSATTT*KTYS*LC*RLCKF*DTRSKRSSSTSRVSCSIKFRN*RIVLLACSIP*LSQ*LKEQIKL*K*DKKLAELFSTYLER*DKA*KRLCNKISGK*SKSCMAR*PAVKERIERVNPRPAAKKEQAEPAAAKVRAASRDLEKYRAITSSNTSTTNAACA*LEAQEEEEVGFPVRPQVPLRPMTYKAALNLSHFLKEKGGLEGLI*SQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRNPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGAAAAAGAATTATTAGAACTAGATCAATGAGCAAATTTGTAGAATTAGTTTAGTATAACAAAATGGCTATAGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAAGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAAAGAACAGATAAAGTTATAGAAGTAAGACAAAAAATTAGCAGAGCTTTTCTCCACATACCTAGAAAGATAAGACAAGGCTTAGAAAAGGCTTTGCAATAAAATAAGTGGCAAGTAGTCAAAAAGTTGTATGGCTAGATAGCCTGCTGTAAAAGAAAGAATAGAAAGAGTTAATCCAAGGCCTGCTGCAAAGAAAGAACAAGCTGAGCCAGCAGCAGCTAAGGTAAGAGCAGCATCTCGAGACTTAGAAAAATATAGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTAGCTAGAAGCACAAGAGGAAGAAGAAGTAGGCTTTCCAGTCAGACCTCAAGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTAAATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTAGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGAAATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATAGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA -MK114856.1,tat_exon2,8102,8198,8375,8471,forward,0.7134052388289676,RPSSQPQEDQTGPKE,RPSSQPQEDQTGPKE*KKKVKRETEADPED**,AGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGA -MK114856.1,rev_exon2,8103,8379,8376,8652,forward,0.6888374145157732,ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE,DPPPNPKKTRQARKNRRRR*KERQRQIQKISD*ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE*,GACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAG -MK115009.1,gag,302,1715,789,2292,forward,0.7484174646972894,MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC,MGARASVLSGGKLDR*EKIYLRPEGKKKYRLKHIV*ASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQIVHQPLSPRTLNA*VKVIEEKAFSPEVIPMFSALSERATPQDLNTMLNTVRGHQAAMQMLKETINDEAAE*DRLHPVHAGPIAPGQMKEPRGSDIAGTTSTLQEQIR*MTHNPPIPVGEIYKRWIILRLNKIVRMYSPVSILDIRQRPKEPFKDYVDRFYKTLKAEQASQDVKN*MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC*KCRKERHQMKDCTKRPD*DG*FFKEDLAFPQGKAREFSPEQTRANSPASRELQV*,ATGGGTGCTAGAGCGTCAGTATTAAGCGGCGGAAAATTAGATAGATAGGAAAAAATTTACCTAAGGCCAGAAGGAAAGAAAAAATATAGATTAAAACATATAGTATAGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTAGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGCGTACATCAAAGGATAAATGTAAAAGACACCAAGGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATAGTACATCAACCATTATCACCTAGAACTTTAAATGCATAGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAAGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGAGAGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAGGCTGCAGAATAGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAAAGAACCAAGAGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAAGATAGATGACACATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTAAGGCTAAACAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAAGACCAAAAGAACCCTTTAAAGATTATGTAGACCGATTCTATAAAACTCTAAAGGCTGAGCAAGCGTCACAGGATGTAAAAAATTAGATGACAGAAACCTTGTTAGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTAAGAGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAGTCAGCCTCCATAATAGTGCAAGGAGGCAATTTTAAGAACCAAAGAAAGAATGTTAAGTGTTTCAATTGTGGCAAAGAAAGACACACAGCCAAAAATTGCAGGGCCCCTAAGAAAAAAGGCTGTTAAAAATGTAGAAAGGAAAGACACCAAATGAAAGATTGTACTAAGAGACCAGACTAAGACGGCTAATTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGA -MK115009.1,pol,1613,4625,2084,5096,forward,0.7535201229073285,AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED,FFKEDLAFPQGKAREFSPEQTRANSPASRELQV*GRGNSSSSEAGDERPRTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEINLPGK*KPKMIKRIRSFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKSGIDSPRVKQWPLTEEKIKALIEICAEIEKEKKITKIRPENPYNTPVFAIKKKDSTK*KKLVDFRELNKRTQDF*EVQLRIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPEVKYQYNVLPQR*KRSPAIFQSSMTKILEPFRKENPDIVIYQYIDDLYVRSDLEIEQHRTKIEELRQHLLR*GLTTPDKKHQKKPPFL*ISYELHPDK*TVQPIQLPDKDS*TVNDIQKLVRKLN*ASQIYPEIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQRRDQ*TYQIYQEPFKNLKTEKYARTRGAHTNDVKQLTEAVQKIALEAIVI*RKTPKFKLPIQKET*KMWWTKYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVRAETFYVNKAANRKTKLRKAEYVTDRRRQKVVSLIDTTNQRTKLHAIHLALQDSGSTVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKEKIYLA*VPAHKRIEGNEQVDKLVSNRIRRVLFLDRIDKAQEEHEKYHSN*RAMASNFNLPPVVAKEIVASCDKCQLKGEPMHRQVDCSPGIWQLDCTHLERKIILVAVHVASRYIEAEVIAAETGQETAYFILKLAGR*PVKIIHTDNGSNFTSTTVKAAC**AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED*,TTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGAGGAAGAGGCAACAGCTCCTCCTCAGAAGCAGGAGACGAAAGACCAAGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATAAATTTGCCAGGAAAATAGAAACCAAAAATGATAAAAAGAATTAGAAGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACGCCAGTCAACATAATTAGAAGAAATCTGTTGACCCAGCTTAGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGTCAGGAATAGATAGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATAGAAAAGGAAAAGAAAATTACAAAAATTAGGCCTGAGAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGAAAAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTAAGAAGTTCAACTAAGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTAGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGAAGTTAAATATCAGTACAATGTGCTTCCACAGAGATAGAAAAGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATAGATGATTTGTATGTAAGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAAGAACTGAGACAACATCTGTTAAGGTGAGGACTCACCACACCAGACAAGAAACATCAGAAAAAACCTCCATTTCTTTAGATAAGTTATGAACTCCATCCTGATAAATAGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTAGACTGTCAATGACATACAGAAGTTAGTAAGAAAGTTGAATTAGGCAAGCCAGATCTATCCAGAGATTAAAGTAAAGCAATTATGTAAACTCCTTAGAGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAGAGATTCTAAAAGAACCAGTACATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGAGGAGAGACCAATAGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGAGAAATATGCAAGAACGAGAGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGAAGAAAGACTCCTAAATTTAAACTACCTATACAAAAAGAAACATAGAAAATGTGGTGGACAAAGTATTGGCAAGCCACCTAGATTCCTGAGTAAGAATTTGTCAATACCCCTCCCTTAGTAAAACTATAGTACCAGTTAGAGAAAGAACCCATAGTAAGAGCAGAAACTTTCTATGTAAATAAGGCAGCTAATAGAAAGACTAAATTAAGAAAAGCAGAGTATGTTACGGACAGAAGAAGACAAAAGGTTGTCTCCCTAATAGACACAACAAATCAGAGGACTAAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAAAGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAAGAAAAGATTTACCTGGCATAAGTCCCAGCACACAAAAGAATTGAAGGAAATGAACAAGTAGATAAATTAGTCAGTAATAGAATCAGAAGAGTACTATTTCTAGATAGAATAGATAAAGCCCAAGAAGAACATGAAAAATATCACAGTAATTAGAGAGCAATGGCTAGTAATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATAGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAAGAAAAATTATCCTAGTAGCAGTTCATGTAGCCAGTAGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATAGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACAGTTAAAGCCGCCTGTTAGTAGGCAGAGATCAAGCAGGAATTTAGTATTCCCTACAATCCTCAAAGTCAAAGAGTAGTAAAATCTATGAATAATAAATTAAAGAAAATTATAGGACAGGTAAAAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCATAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCAGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGAGATTATAGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115009.1,vif,4289,4988,5040,5619,forward,0.7624714704923379,MAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED,MAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED*NIEQFSKTPYAYFKESSEIGLQTSL*KP*SKNKFRSTHPIRGSKIGNKNILRSAYRRKRLAFRPGSIHRMEEKEI*HTSRPWPGRPTNSPVLF*LFFRICYKECHIRT*S*S*V*ISGRT*,ATGGCAGTATTCATTCATAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCAGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGAGATTATAGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATAGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATAGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGAGGAAGCAAGATTGGTAATAAAAACATATTAAGGTCTGCATACAGGAGAAAGAGACTGGCATTTAGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAGGCAGGACATAA -MK115009.1,vpr,5087,5378,5558,5849,forward,0.6737199868435482,MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT,MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT*AEVEAIIRTLQQLLFIHFRIRCQHSRIGIIRQRRARNRASRS*,ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATAAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAG -MK115009.1,tat_exon1,5235,5577,5829,6045,forward,0.6325105553751218,MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ,MEILRQR*KP**EPCNNCCSFISELGVNIAG*ELFDRGEQEIEPVDPSLEP*KHPGSQPMTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ*,ATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGCTTAGAGCCCTAGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAACAAAAAGCTTAGGCATCTCCTATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA -MK115009.1,rev_exon1,5497,5578,5968,6046,forward,0.564475664826894,MAGRSRDSDEELLTAVRIIKRLYQSSK,MAGRSRDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG -MK115009.1,vpu,5589,5835,6060,6309,forward,0.6256860592755216,MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP,MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP*DSNDM*,ATGCATGCCTTAGAAATAGCAGCAATAGCAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAAGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGACGAGGACCAAGAGGAATTATCCGCACTTGTGGAGATGAGGCATCTTGTTCCTTAAGATAGTAATGATATGTAG -MK115009.1,env,5752,8353,6223,8794,forward,0.7518870380010406,MKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD,MRVTRTKRNYPHLWR*GILFLKIVMICSANNL*VTVYYKVPV*KEATTTLFCASDAKAYETEKHNV*ATHACVPTDPSPQEVALENVTETFNM*KNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDNLNLTCPNNNTCSNNTNYNMKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD*NDTLKQIVIKLKEKFKNKTIVFTQSSGEDPEIVMHSFNCREEFFYCNTTQLFNST*NNST*NSTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQRQIRCSSNITGLLLVRDGRSNNSSNDTETFRPRGRDMKDN*RSKLYKYKVVKIKPLRIAPTHAKRRVVQKEKRAIRLEAFFLRFLRAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQAKVLALERYLKDQQLLRI*SCSGKLICTTNVPWNISWSPRWNRSLDKI*TNMT*KQ*EKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQ*L*YIKIFIIIVRGLISLRIVFTILSIVNKVRQGYSPLSLQTLLPTQRGPDRPERTEERGRKKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLKDLLLIAARIVELLGRRK*EALKY**NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL*,ATGAGAGTGACGAGGACCAAGAGGAATTATCCGCACTTGTGGAGATGAGGCATCTTGTTCCTTAAGATAGTAATGATATGTAGTGCCAACAACTTGTAGGTCACAGTCTATTATAAAGTACCTGTATAGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTAGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTAGAAAATGTGACAGAAACATTTAACATGTAGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATAGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAACTTGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATGAAAGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAAGGTGACAAAAGAACATGCACTTTTCTATAAACTTAATGTAGTACCAATAGATGAAGATAGTAAAAATACTACGGGCAAATATAAGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTAAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATAGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATAGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTAAACGGCAGTCTAGCAGAAGAAAAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATAGAACAGACATAATAAGAGATATAAGACAAGCGCATTATAACATTAGTAAGAAAGATTAGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTAAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGAAGACCCAGAGATAGTGATGCATAGTTTTAATTGTAGAGAGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTAGAATAATAGTACTTAGAATAGTACTGATAATTAGAATAGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAAGAAGAGCAATGTATGCCCCTCCCATCCAAAGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTAGGAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTAGAGGAAGAGATATGAAGGACAATTAGAGAAGTAAATTATATAAATATAAAGTAGTCAAAATTAAACCATTAAGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAAGGAAAAAAGAGCAATAAGACTTGAAGCTTTCTTCCTTAGGTTCTTAAGAGCAGCAGGAAGCACTATAGGCGCAGCGTCAGTGACGCTGACAGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTAAGGCATCAAGCAGCTCCAGGCAAAAGTCCTGGCTTTAGAAAGATACCTAAAAGATCAACAGCTCCTAAGGATTTAAAGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATAAGATTTAGACTAACATGACCTAGAAGCAGTAAGAAAAAGAAATTGACAATTACACAGACATAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTAGGCAAGTTTGTAAAATTAGTTTGACATTACACAGTAGCTATAGTATATAAAAATATTCATAATAATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGAGGACAGATAAAATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAA -MK115009.1,nef,7748,8996,8795,9416,forward,0.7328145265888457,MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR,MNKTYWH*ISRQVCKISLTLHSSYSI*KYS****EA**V*E*FLLYCL**IKLGKDTHHCHCRPSSQPREDPTGPKEQKKEVERKTEAHPRD*CIDS*HSSRTTCGACSSSVTTA*KTYS*LRREL*NF*DAESKKH*SISRISCSIRVRK*RIVQLACSTPQQ*Q*LRGQIKL*KYYKEALELFSTYLHE*DRA*KRLCYKIGNKLSRRLKARWPAIKEKIRRARPVREPEPATAKVRAASRDLKRHGALTSSNTAATNADVACLEAQQKKEEVSFPVRPQVPLRPMTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR*CFKLVPVDPDKVEEASVRENNCLLSPENLHRMEDEHREVLQWRFDSRLAFHHIARELHPEYYKDC*,ATGAACAAGACTTATTGGCATTAGATAAGTAGGCAAGTTTGTAAAATTAGTTTGACATTACACAGTAGCTATAGTATATAAAAATATTCATAATAATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGAGGACAGATAAAATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAAGATAGGTAACAAGTTGTCAAGAAGGCTCAAGGCTAGATGGCCTGCCATAAAGGAGAAAATAAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAACAGCTAAGGTAAGAGCAGCATCTCGAGACCTGAAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTAGAAGCACAACAGAAGAAAGAAGAGGTAAGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGAGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAAGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTAGATAGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAAGTAGAAGAGGCCAGTGTAAGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATAGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACATAGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA -MK115009.1,tat_exon2,7934,8027,8375,8471,forward,0.5633802816901408,RPSSQPREDPTGPKEQKKEVERKTEAHPRD,RPSSQPREDPTGPKEQKKEVERKTEAHPRD*,AGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAG -MK115009.1,rev_exon2,7935,8211,8376,8652,forward,0.6781884553958476,ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE,DPPPNPERTRQARKNRRKR*KERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAG -MK115387.1,gag,292,1795,789,2292,forward,0.25442849599155104,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCTGTATTAAGCGGGGGAGAATTAGATAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAGAAAAGATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCCGGCCTTTTAGAAACAACAGAGGGATGTAAACAAATACTGGAACAGCTGCAACCATCCCTTCCGACAGGATCAGAAGAACTTAGATCATTATTTAATACAGTAGCAACCCTCTATTGTGTGCATAAGAGAATAGAGGTACAAGACACCAAGGAAGCCTTAGAAAAGATAGAAGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAGGCAGTAGCTGACACAGGAAGTACCAGCCAGGTCAGCCAAAATTACCCGATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGGCCATATCGCCTAGAACTTTAAATGCATGGGTGAAAGTAGTAGAAGAGAAGGCCTTTAGCCCAGAGGTAATACCCATGTTTTCAGCATTATCGGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAGGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTGTTGCACCAGGCCAAATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAAGAACAAATAGCATGGATGACAAGTAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAGATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAGTCCTAAGAGCCGAGCAAGCATCGCAGGATGTAAAAAATTGGATGACAGAAACCTTATTGGTCCAAAATGCAAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCAGCAGCAACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAAATATCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGACTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTCCAAGGGAAGGCCAGGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAGGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA -MK115387.1,pol,1587,4599,2084,5096,forward,0.17509882471546434,FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCTCCAAGGGAAGGCCAGGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAGGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGAGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGACACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCTATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGCAGAAATTTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTACAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAAGAAGGGAAGATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGGGAACTTAATAAAAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAGAAATCAATAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAATAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGATAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGACATAGTTATCTATCAATACATGGATGACTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACACTTGTTGAAGTGGGGATTGACCACACCAGATAAAAAACATCAGAAAGAACCCCCATTCCTGTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGACAAAGATAGCTGGACTGTCAATGACATACAGAAGCTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTGAGACAATTATGTAAACTCCTTAAGGGAGCCAAAGCGCTAACAGAAGTGATACAACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAGTTACAGAAGCAGGGGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAACGAGGGGTACCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTGATATGGGGAAAGACCCCTAGATTTAAACTACCCATACAGAAAGAAACATGGGATACCTGGTGGACAGAATATTGGCAAGCCACCTGGATTCCCGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAAAAAGAACCTATTGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAGCAGAGGAAGACAAAAGGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAACTGCAAGCAATTTGTCTAGCATTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCACTAGGAATAATTCAAGCACAACCAGATAGGAGTGAATCAGAGATAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAGGGTCTACCTTGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTCCTATTTTTGGATGGAATAGATAAGGCCCAAGAGGAGCATGAGAAATATCACAATAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGTTGTGATAAATGCCAGCTAAAGGGAGAAGCCACGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTCCTCTTAAAATTAGCAGGAAGGTGGCCAGTGAAAGCAATACATACAGACAATGGAACCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATGTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAAGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTCCAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAACAGAGATCCACTTTGGAAAGGACCAGCAAAACTTCTTTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115387.1,vif,4543,5122,5040,5619,forward,0.34158090650317496,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGCACATGGAAAAGTTTAGTAAAACACCATATGTACATTTCAAAGAAAGCCCAGGGATGGTTTTATAGACATCACTATGAAAATCCTCATCCAAGAATAAGTTCAGAAGTACACATCCCGCTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGCAGGGAAAGGAAATATAGCACACAAGTAACCCCTGACCTAGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTGCAGAATCTGCTATAAGAGAGGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAACAGCATTAGTAACACCAAAAAAGACAAAGCCACCTTTGCCTAGTGTGACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCAAACAATGAATGGACACTAG -MK115387.1,vpr,5061,5352,5558,5849,forward,0.2608047690014903,MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS,MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTGGGACAACATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115387.1,tat_exon1,5332,5551,5829,6045,forward,0.37688442211055273,MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ,MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ*,ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAAATGCTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGA -MK115387.1,rev_exon1,5471,5552,5968,6046,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKYLYQSSE,MAGRSGDSDEDLLKTVRLIKYLYQSSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGAG -MK115387.1,vpu,5563,5809,6060,6309,forward,0.5560235888795282,MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL,MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL*,ATGCAATCCTTATATATATTAACAATAGTAGCATTAGTAGTAGCAGCAATATTAGCAATAGTTGTGTGGGCCATAGTACTCATAGAATATAAGAAAATATTAAAACAAAGGAGAATAGATAGGTTAATTGATAGAATAATAGATAGGGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAG -MK115387.1,env,5726,8288,6223,8794,forward,0.5276672448389619,MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL,MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL*,ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTAATAGGAAATGTAACAGAAGATTTTAACATGTGGAAGAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGTCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGTACTGATATTAGGAATAGTACCGTTACTTCTAATACTACTACTTGGGGAGAAATGACAAACTGCACTTTCAATATCACCACAAGCATAAAGGATAAGATGAAAAAAGAAGCGGCACTTTTTTATAAAATTGATTTAGTAGAAATAGATGAAGAGAAAAATAACAGTAGTACCAGATATAGGTTGATAAATTGTAACACCTCAGCCATTACACAAGCCTGCCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCAATTCTAAAGTGTAATAATAAGAAGTTCAGTGGAAAGGGACCATGTACAAATGTCAGCACAGTGCAATGTACACATGGAATTAAGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAATGATTAGATCTGACAATATCACAGACAATACTAAAAACATAATAGTACAGTTGAAGGAAGCCATACAAATTTTCTGTATAAGACCCAACAACAATACAAGAAAAAGTATAAATATAGGACCAGGGAGAGCATTTTACACAACAGGAGATATAATAGGAGACATAAGGCAAGCACATTGTAACATTAGTGGAAATTGGAATAACACTTTAAAACAGATAGCTACACAATTAGGAAAACAACTGAATCAAACACAACAAATAATCTTTAATTCATCCGCAGGAGGGGACCCAGAGATTGTAACACACAGTTTTAATTGTGGAGGGGAATTCTTCTATTGTAATTCATCATCACTGTTTAATAGTACCTGGACTAAAAATGGTACTGGTAGTTGGCAGTCTAATGATACTCAGAATGGTAATATCACACTCCAATGCAGAATAAAACAAATTATAAACCTGTGGCAGGGAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAACTGTACATCAAATATTACAGGGCTGGTTTTAACAAGAGATGGGGGGAAGGTGATTAATGAAACTGAGACCTTTAGACCTGGAGGAGGAAATATGAAGGATAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAAAGAGAGAAAAGAGCAGTAGGACTGGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCCGGAAGCACTATGGGCGCAGCGTCAATAGCGCTGACGGAACAGGCCAGACGAGTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATTTGTTGCAACTCACAGTCTGGGGCATTAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTAGGACTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATCGTAGTTGGGGTGGGCATAACAAAAATCTAGATGACATTTGGGGTAACATGACCTGGATGGAGTGGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTACAGAATCACATTCCCAACAAGAAAAGAATGAACAAGAATTATTGGCATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAGGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTGGGACGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAGGGACAGATAGGATAATAGAAATATTACAAAGAATTGGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -MK115387.1,tat_exon2,7869,7965,8375,8471,forward,0.6995153473344102,RPSSQLRGEPTGPKE,RPSSQLRGEPTGPKE*KKEVERETKADPVD**,AGACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGA -MK115387.1,rev_exon2,7870,8146,8376,8652,forward,0.32366339007432277,DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE,DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE*,GACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTGGGACGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAATAG -MK115387.1,nef,8289,8940,8795,9416,forward,0.4631394979345408,MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC,MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTAGGGTTGGATGGAATGCAGTGAGGGAAAGAATGAGACGAGCTCAGCCAACAGCAGATAGGGAACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTAGAGACCTGGAAAAATATGGAGCACTTACAAGTAGGAATACAGCAGCTACTAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGATGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGACCCATGACTTATAAAGCAGCTCTAGATCTGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAGTTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTATTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCACTTGAGCCAGATCAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCCTGTTACACCCTCTGAGCCAGCATGGGATGGATGACCCGGAGAAAGAAGTGCTAGTGTGGAGGTTTGACAGCCGCCTCGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAAGACTGCTGA -MK115491.1,gag,521,2021,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115491.1,pol,1813,4825,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115491.1,vif,4769,5348,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115491.1,vpr,5287,5578,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115491.1,tat_exon1,5558,5777,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115491.1,rev_exon1,5697,5778,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115491.1,vpu,5789,6035,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115491.1,env,5952,8493,6223,8794,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115491.1,tat_exon2,8074,8170,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115491.1,rev_exon2,8075,8351,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115491.1,nef,8494,9109,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK116110.1,gag,62,1601,140,1643,forward,0.7362754920106639,MSQVNSTTVMMQKGNFRNQKKTVKCFNCGKIGHIAKNCRAPRRKGCWKCGQEGHQMKDCSERQANFLGKLWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPIDRELYSLASLKSLFGNDPSSQ,MAGSPHSLTCCHHFF*CSCWSQCF*NSLTIWVCILDQQGFCHPIFYIL*SLLGS*GFIEPVYIVSKGFLWSLFYVQNADRTIHSYYFI*SQDYPSFIDISYWDRWIICHPSYLFLKGTSSSCYITSPWFSHLAWCNRPCMHWMQSIPFCSFLIDGLF*YLHCCLMSPHCI*HGVYILWGGSFC*C*KHRYYFWAKSLFFYYFYPCI*SSR*HGLMYHLPLEVLHYRVVLADLAVISCASCCLLCFHLAFVLLFLYLI*RSLGVLYLYPLMYTIEDRYCII**FKLF*PCLEGWL*LSQYLSTAF*CF*QARINCESF*LPACPY*MF*PIFFLSSWP*PNFFPLV*FSPA*Y*RSRTHLSPSSLR*VKTFLAYSPVAEAMSQVNSTTVMMQKGNFRNQKKTVKCFNCGKIGHIAKNCRAPRRKGCWKCGQEGHQMKDCSERQANFLGKLWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPIDRELYSLASLKSLFGNDPSSQ*,ATGGCCGGGTCCCCCCACTCCCTGACATGCTGTCATCATTTCTTCTAGTGTAGCTGCTGGTCCCAATGCTTTTAAAATAGTCTTACAATCTGGGTTTGCATTTTGGACCAACAAGGTTTCTGTCATCCAATTTTTTACATCCTGTGAAGCTTGCTCGGCTCTTAGGGTTTTATAGAACCGGTCTACATAGTCTCTAAAGGGTTCCTTTGGTCCTTGTTTTATGTCCAAAATGCTGACAGGACTATACATTCTTACTATTTTATTTAATCCCAGGATTACCCATCTTTTATAGATATCTCCTACTGGGATAGGTGGATTATTTGTCATCCATCCTATTTGTTCCTGAAGGGTACTAGTAGTTCCTGCTATATCACTTCCCCTTGGTTCTCTCATTTGGCCTGGTGCAACAGGCCCTGCATGCACTGGATGCAATCTATCCCATTCTGCAGCTTCCTCATTGATGGTCTCTTTTAATATTTGCATTGCTGCTTGATGTCCCCCCACTGTATTTAGCATGGTGTTTATATCTTGTGGGGTGGCTCCTTCTGCTAATGCTGAAAACATAGGTATTACTTCTGGGCTAAAAGCCTTTTCTTCTACTACTTTTACCCATGCATTTAAAGTTCTAGGTGACATGGCCTGATGTACCATTTGCCCCTGGAGGTTTTGCACTATAGGGTAGTTTTGGCTGACCTGGCTGTTATTTCCTGCGCCAGCTGCTGCTTGCTGTGCTTTCATCTTGCTTTTGTTTTGCTCTTCCTCTATCTTATCTAGCGCTCCCTTGGTGTCTTGTATCTCTATCCTTTGATGTATACAATAGAGGACCGCTACTGTATTATATAATGATTTAAGCTCTTCTGACCCTGTTTGGAGGGATGGCTGTAGCTGTCCCAGTATTTGTCTACAGCCTTCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGCTCCCTGCTTGCCCATACTAGATGTTTTAACCTATATTTTTTCTTTCCTCCTGGCCTTAACCGAATTTTTTCCCATTGGTCTAATTTTCCCCCGCTTAATACTGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGGTAAAAACTTTTTTGGCGTACTCACCAGTCGCCGAAGCAATGAGCCAAGTAAATTCAACTACCGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAAGAAGACTGTTAAGTGTTTCAACTGTGGTAAAATAGGGCATATAGCAAAAAATTGCAGGGCCCCCAGGAGAAAGGGCTGTTGGAAATGTGGACAGGAAGGACACCAGATGAAAGATTGTAGTGAGAGACAGGCTAATTTTTTAGGGAAACTCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAAGAGACAGCAACTCCCCCTCAGAAGCAGGAGCCGATAGACAGGGAACTATATTCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCTCAATAA -MK116110.1,pol,1393,4405,1435,4447,forward,0.2475474244944199,FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED,FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED*,TTTTTTAGGGAAACTCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAAGAGACAGCAACTCCCCCTCAGAAGCAGGAGCCGATAGACAGGGAACTATATTCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCTCAATAAAAGTAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGTGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAATATGATCAGATACCCATAGAAATCTATGGACATAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATTTGTTGACTCAGATTGGGTGCACTTTAAATTTTCCCATTAGTCCTATCGAAACTGTACCAGTAAGATTAAAGCCAGGAATGGATGGCCCAAAAATTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAGATTTCAAAGATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGGGAACTTAATAAGAGAACTCAAGATTTCTGGGAAGTTCAATTGGGAATACCGCATCCCGCAGGATTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCATTAGATAAAGACTTTAGGAAGTATACTGCATTTACCATACCCAGTGTAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAGCTAGCATGACAAAAATTTTAGAGCCTTTTAGGAAGCAAAATCCAGACATGGTTATTTATCAATACATGGATGATCTATATATAGGATCTGACTTGGAATTAGGACAGCATAGGACAAAAATAGAGGAACTGAGACAACATCTATTGAGGTGGGGGTTTACCACACCAGACAAGAAGCATCAGAAAGAACCTCCATTCCTCTGGATGGGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAACACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTAGGAAAATTAAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTAAGGCAGTTATGTAAACTCCTTAGAGGAACCAAATCACTAACAGAAGTAGTACCACTAACAAGAGAGGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCGGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAATTACAAAAGCAGGGACAAGGCCAGTGGACTTATCAGATTTATCAAGAACCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAATAAAGGGTACCCACACTAATGATGTAAAACAATTAACACAGGCTGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATCCCTGAGTGGGAGTTTGTTAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGACCCCATAGTAGGAGCAGAAACATTCTATGTCGATGGGGCAGCCAATAGGGATACTAAATTAGGAAAAGCAGGATATGTTACTGACAGGGGAAGACAAAAAATTGTCCCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTTACCTAGCTCTGCAGGATTCAGGATCAGAAGTAAACATAGTATCAGACTCACAGTATGCAATAGGAATTCTTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGACATGGGTGCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTATTATTCTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCCATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGTTAAAAGGAGAAGCCATACATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTGGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTGGCCAGTGGATATATTGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATATTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAACACAATACATACAGACAATGGCAGCAACTTCACTAGCACTGCGGTTAAAGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGGGATCAAGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGAGGTACAGTGCAGGGGAAAGAATAGTAGACATGATAGCATCAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAACAGTGAAATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGACTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAGGTAGACAGGATGAGGATTAA -MK116110.1,vif,4349,4928,4391,4970,forward,0.4686663095875737,MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH,MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAGGTAGACAGGATGAGGATTAATGCATGGAAAAGCTTAGTAAAGCACCATATGCATGTTTCAAGGAAAGTTGAGAGATGGGTTTATAAACATCACTATGAAAGTACTAATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTAAAAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGAAAAAAGAGCTATAATACACAAGTAGACCCTGAAGTAGCAGACCAACTAATCCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAAAGCCATAGTAGGACATAGAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCCCTACAGTACTTGGCATTAGCAGCATTAGTAAAATCAAAAAAGACAAAGCCACCTTTGCCTAGCGTTACGAAGCTGACGGAGGATAGATGGAACAAGCCCCAGAGGACCAAGGGCCGCAGAGGGAACCATATAATGAATGGGCACTAG -MK116110.1,vpr,4867,5158,4909,5200,forward,0.4534005037783373,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPRIWLQSLGQYVYETYGDTWTGVEAIIRILQQMLFIHFRIGCQHSRIGIIRRGRTRNGASRP,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPRIWLQSLGQYVYETYGDTWTGVEAIIRILQQMLFIHFRIGCQHSRIGIIRRGRTRNGASRP*,ATGGAACAAGCCCCAGAGGACCAAGGGCCGCAGAGGGAACCATATAATGAATGGGCACTAGAGCTTTTAGAGGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGGATATGGCTTCAGAGCTTAGGACAATACGTCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTTTGCAACAAATGCTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATTCGACGAGGGAGAACAAGAAATGGAGCCAGTAGACCCTAG -MK116110.1,tat_exon1,5138,5357,5180,5399,forward,0.48719691819623834,MEPVDPSLAPWKHPGSQPKTACTNCYCKKCCLHCQVCFTKKGLGISYGRKKRRQRRRPPQSSKAHQNPLPKQ,MEPVDPSLAPWKHPGSQPKTACTNCYCKKCCLHCQVCFTKKGLGISYGRKKRRQRRRPPQSSKAHQNPLPKQ*,ATGGAGCCAGTAGACCCTAGCCTAGCGCCCTGGAAGCACCCAGGAAGTCAGCCTAAGACTGCTTGTACCAATTGCTATTGTAAAAAGTGCTGCTTACATTGCCAAGTTTGTTTCACAAAAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAGCAGTAAGGCTCATCAAAATCCTCTACCAAAGCAGTAA -MK116110.1,rev_exon1,5277,5358,5319,5397,forward,0.4807692307692307,MAGRSGDSDEDLLKAVRLIKILYQSSK,MAGRSGDSDEDLLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAGCAGTAAGGCTCATCAAAATCCTCTACCAAAGCAGTAAG -MK116110.1,vpu,5369,5615,5411,5657,forward,0.46373488953730724,MQSLQIGAIVALVVGTIIAIVVWSIVLIEYRKILRQKKIDRIIDRIVERAEDSGNESEGDQEELSALVERGHDAPWNVNDL,MQSLQIGAIVALVVGTIIAIVVWSIVLIEYRKILRQKKIDRIIDRIVERAEDSGNESEGDQEELSALVERGHDAPWNVNDL*,ATGCAATCTTTGCAAATAGGAGCAATAGTAGCATTAGTAGTAGGAACAATAATAGCAATAGTTGTGTGGTCTATAGTACTCATAGAATATAGGAAAATATTAAGACAAAAGAAAATAGATAGAATAATAGATAGAATAGTAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGACCAGGAAGAGTTATCAGCACTGGTGGAAAGGGGGCATGATGCTCCTTGGAATGTTAATGATCTGTAG -MK116110.1,env,5532,8073,5574,8124,forward,0.47450452559300893,MRVKETRKSYQHWWKGGMMLLGMLMICSAATNLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVLLGNVTEDFNAWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILHCTDVNNTRNGMTGELKNCSFNITTKITNKVQKEYALFYKLDVVPINNKDNDTSFNNNSYRLISCNTSVITQACPKVSFEPIPIHYCTPAGYAILRCNNETFSGKGPCTNVSSIQCTHGIRPVVSTQLLLNGSLAKQEVVIRSQNFSDNVKTIIVQLKTPVKINCTRPNNNTRKSIHAGPGKVIYATGEIIGDIRQAHCNISAAEWNDTLGQIVTKLQEQFGNKTIVFNQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWNNNGTNTWNSTGNITLPCKIRQIVNMWQKVGKAMYAPPIRGQIKCSSNITGLLLTRDGGNESESETFRPGGGDMRDNWRSELYKYKVVRIEPLGLAPTKAKRRVVQREKRAIGTLGAVFLGFLGTAGSTMGAASMTLTVQARQLLSGIVQQQNNLLKAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNASWSNKSLNEIWDNMTWMEWEKEISNYTQLIYTLIEESQSQQEKNEQELLALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEDGGERDRDRSTRLVTGFLPLFWDDLRSLCLFSYHRLRDLLLIAARIVELLGHRGWEILKHWWSLLQYWSQELKKSAVSLLNATAIAVAEGTDRIIEVVQRACRAILHIPVRLRQGLERALL,MRVKETRKSYQHWWKGGMMLLGMLMICSAATNLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVLLGNVTEDFNAWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILHCTDVNNTRNGMTGELKNCSFNITTKITNKVQKEYALFYKLDVVPINNKDNDTSFNNNSYRLISCNTSVITQACPKVSFEPIPIHYCTPAGYAILRCNNETFSGKGPCTNVSSIQCTHGIRPVVSTQLLLNGSLAKQEVVIRSQNFSDNVKTIIVQLKTPVKINCTRPNNNTRKSIHAGPGKVIYATGEIIGDIRQAHCNISAAEWNDTLGQIVTKLQEQFGNKTIVFNQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWNNNGTNTWNSTGNITLPCKIRQIVNMWQKVGKAMYAPPIRGQIKCSSNITGLLLTRDGGNESESETFRPGGGDMRDNWRSELYKYKVVRIEPLGLAPTKAKRRVVQREKRAIGTLGAVFLGFLGTAGSTMGAASMTLTVQARQLLSGIVQQQNNLLKAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNASWSNKSLNEIWDNMTWMEWEKEISNYTQLIYTLIEESQSQQEKNEQELLALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEDGGERDRDRSTRLVTGFLPLFWDDLRSLCLFSYHRLRDLLLIAARIVELLGHRGWEILKHWWSLLQYWSQELKKSAVSLLNATAIAVAEGTDRIIEVVQRACRAILHIPVRLRQGLERALL*,ATGAGAGTGAAGGAGACCAGGAAGAGTTATCAGCACTGGTGGAAAGGGGGCATGATGCTCCTTGGAATGTTAATGATCTGTAGTGCTGCAACAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACGCATGCCTGTGTACCCACGGACCCCAACCCACAAGAAGTATTATTGGGAAATGTGACAGAAGATTTTAATGCATGGAAAAATAACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAATTAACCCCACTTTGTGTTATTTTGCATTGCACTGATGTCAACAATACTAGAAATGGGATGACAGGAGAACTAAAAAACTGCTCTTTCAATATCACCACAAAAATAACAAATAAGGTACAGAAAGAATATGCACTCTTTTATAAACTTGATGTAGTACCAATAAATAATAAGGATAATGATACTAGCTTTAATAATAATAGCTATAGGTTGATAAGTTGTAACACCTCAGTTATTACACAGGCTTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTACTGTACCCCGGCTGGTTATGCAATTCTAAGGTGTAACAATGAGACATTCAGTGGAAAAGGGCCATGTACAAATGTCAGCTCAATACAATGTACACATGGAATTAGGCCAGTAGTGTCAACTCAACTGCTGTTAAATGGCAGTCTAGCAAAACAGGAGGTAGTAATTAGATCTCAAAATTTCTCGGACAATGTTAAAACCATAATAGTACAGCTGAAGACCCCTGTAAAAATTAACTGTACAAGGCCCAATAACAATACAAGAAAAAGTATACATGCAGGACCAGGGAAAGTAATTTATGCAACAGGAGAAATAATAGGAGATATAAGACAAGCACATTGCAACATTAGTGCAGCAGAGTGGAATGATACTTTAGGACAGATAGTTACAAAATTACAAGAACAATTTGGGAATAAAACAATAGTCTTCAATCAATCGTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTTTACTGTAATTCAACACAACTGTTTAATAGTACTTGGAATAATAATGGTACTAATACTTGGAATAGTACAGGTAATATCACACTCCCATGTAAAATAAGGCAAATTGTAAACATGTGGCAGAAAGTAGGAAAAGCAATGTATGCTCCTCCCATCCGTGGACAAATTAAATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAACGAGAGTGAGAGCGAAACCTTCAGACCTGGCGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGACTAGCACCCACTAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAACACTGGGAGCTGTGTTCCTTGGGTTCTTGGGAACAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGGCAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATCTGCTGAAGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATTAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGCAATAAATCTCTGAATGAAATTTGGGATAACATGACCTGGATGGAGTGGGAAAAAGAAATTAGTAATTACACACAATTAATATACACTTTAATTGAAGAATCGCAGAGCCAGCAAGAAAAGAATGAACAAGAATTATTGGCACTAGATAAGTGGGACAGCTTGTGGAGTTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAATAGGGTTAAGAATAGTTTTTACTGTACTTTCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTGTCATTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGACGGTGGAGAGAGAGACAGAGACAGATCCACACGCTTAGTAACCGGATTCTTACCACTTTTCTGGGACGACCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTACAATATTGGAGTCAGGAACTAAAAAAAAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTAGTACAAAGAGCTTGTAGAGCTATTCTCCACATACCTGTAAGACTAAGACAAGGCTTAGAAAGAGCTTTGCTATAA -MK116110.1,tat_exon2,7654,7750,7705,7798,forward,0.4464285714285715,RPASQPRGDPTGPKESKKTVERETETDPHA,RPASQPRGDPTGPKESKKTVERETETDPHA**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGACGGTGGAGAGAGAGACAGAGACAGATCCACACGCTTAGTAA -MK116110.1,rev_exon2,7655,7940,7706,7982,forward,0.46126825660935467,DPLPSPEGTRQARRNRRRRWRERQRQIHTLSNRILTTFLGRPEEPVPLQLPPLERLTLDCSEDCGTSGTQGVGNPQTLVESPTILESGTKKKCC,DPLPSPEGTRQARRNRRRRWRERQRQIHTLSNRILTTFLGRPEEPVPLQLPPLERLTLDCSEDCGTSGTQGVGNPQTLVESPTILESGTKKKCC*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGACGGTGGAGAGAGAGACAGAGACAGATCCACACGCTTAGTAACCGGATTCTTACCACTTTTCTGGGACGACCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTACAATATTGGAGTCAGGAACTAAAAAAAAGTGCTGTTAG -MK116110.1,nef,8074,8695,8125,8752,forward,0.437094682230869,MGGKWSKSSVVGWPAVRERIRRAGPAAEGVGAVSRDLDKHGAITSNNTPATNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGMIYSQQRQDILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPLETEQVEAATGGENNCLLHPLNQHGMDDPEREVLMWKFDSSLAFHHRAKELHPEYYKDC,MGGKWSKSSVVGWPAVRERIRRAGPAAEGVGAVSRDLDKHGAITSNNTPATNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGMIYSQQRQDILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPLETEQVEAATGGENNCLLHPLNQHGMDDPEREVLMWKFDSSLAFHHRAKELHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGGTTGGATGGCCTGCTGTAAGGGAAAGAATAAGAAGAGCTGGGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGACAAACATGGAGCAATCACAAGTAACAATACACCAGCTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTTAGGCCTCAAGTACCTTTAAGACCAATGACTTACAAGGGAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGATGATATACTCCCAGCAAAGACAAGATATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGACCAGGGGTCAGGTTTCCACTGACCTTTGGATGGTGCTTCAAACTAGTACCACTTGAGACAGAGCAGGTAGAAGCGGCCACTGGAGGAGAGAACAACTGCTTGTTACACCCTTTGAACCAGCATGGGATGGATGACCCGGAGAGAGAAGTACTAATGTGGAAGTTTGACAGCAGCCTAGCATTTCATCACAGAGCCAAAGAGCTGCATCCGGAGTACTACAAAGACTGCTGA -MK115527.1,gag,683,2183,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115527.1,pol,1975,4987,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115527.1,vif,4931,5510,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115527.1,vpr,5449,5740,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115527.1,tat_exon1,5720,5939,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115527.1,rev_exon1,5859,5940,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115527.1,vpu,5951,6197,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115527.1,env,6114,8655,6223,8794,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115527.1,tat_exon2,8236,8332,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115527.1,rev_exon2,8237,8513,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115527.1,nef,8656,9271,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK114997.1,gag,210,1719,789,2292,forward,0.27936962750716343,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP*YQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATGGGAAAAAATTTACCTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGCGTACATCAAAGGATAAATGTAAAAGACACCAAGGAAGCTCTAGACACAATAGAGGAAGAACAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATGGTACATCAACCCATATCACCTAGCACTTTAAATGCATGGGTAAAAGTGATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAGGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAGGGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATACTCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGGGATTATGTAGATCGGTTCTATAAAACTCTAAGGGCTGAGCAAGCGTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCCTCCATAATGGCGCAAGGAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA -MK114997.1,pol,1511,4523,2084,5096,forward,0.26443159013103534,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAGAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCAGTCAACATAATTGGAAGAAATCTGTTGACCCAGCTTGGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGACAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATGGAAAAGGAAGGGAAAATTACAAAAATTGGGCCTGAGAATCCATATAATACTCCAGTGTTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTGGGAAGTTCAACTAGGAATACCACATCCCGCAGGGTTAAAAAGGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTTTCAGTTCCTTTAGACCAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGGAGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGGGGTGGGGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAGTTGAATTGGGCAAGCCAGATCTATCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTCCATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGGGGAGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCTATACAAAAGGAAACATGGGAAATGTGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAATTAGGAAAAGCAGGGTATGTTACGGACAGAGGAAGACAAAAGGTTGTCTCCCTAATGGACACAACAAATCAGAGGACTGAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTAACAGACTCACAATATGCCTTAGGGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAGGAAAAGATTTACCTGGCATGGGTCCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTAATGGAATCAGAAAAATACTATTTCTGGATGGAATAGATAAGGCCCAAGAAGAACATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATACATAGAAGCAGAAGTTATTGCCGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK114997.1,vif,4467,5046,5040,5619,forward,0.3903081914030819,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGGGGAAGCAAGATTGGTAATAAAAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTAGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCCTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAG -MK114997.1,env,4985,8207,6223,8794,forward,0.6657028690558922,MHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*LRALETSRKSTYDCL*QLLL*TVLLSLPSLLHHKRLRHLLWQEEAETATKSFSQQSESSSGSTRAVSITCNACLKNSSNSRISSSNNNSNSCVVYSINRI*ENFKTKENRQVN**NKRKSRRQWQ*K*RRPGGIISTCGDGASCSLGW**YVVPTTCGSQSIMGYLYGKKQLPLYFVHQMLKHMRQRSIMFGQPMPVYPQTPAHRK*H*KM*QKHLTCGKMTW*SRCMRI*SVYGIKA*SHV*N*PHSVLL*IALIV*VIILIII*RKKEK*KTALSMSPQE*EIG*QKNMHFSIDLM*YQ*MKIVEILRANIG**IVTPQSLHKPVQRYPLSQFPYIFVPRLVLRF*SVEIRNSMEQENVEMSAQYNVHMELGQ*YQLNCC*TAV*QKKR**LDLPISRTMLKP**YS*INL*KLIVQDPTIIQEEVYT*DQGEHFMEQT**GI*DKRIVTLVGKIGMTL*KKIVIKLKEKFENKTIVFNQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAGTATTACATGTAATGCATGCCTTAAAAATAGCAGCAATAGTAGGATTAGTAGTAGCAACAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGAGACCAGGAGGAATTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAACAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGAAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAGTTTAAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAGACTTGATGTAGTATCAATAGATGAAGATAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGATATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAGAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAACCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGAGCATTTTATGGAACAGACATAATAGGGGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAAAAAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATGGTACTGATAATTGGAATGGTACTGAATCAAATAACACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCTCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGGAGCAACAATAGTAGTAATGATACAGAGACATTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAGTGGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAGGCAGTGGGAAAAGGAAATTGACAATTACACAGACACAATATATAACTTAATTGAACTATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAGTTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTACTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -MK114997.1,vpr,4985,5276,5558,5849,forward,0.3120665742024965,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK114997.1,tat_exon1,5256,5475,5829,6045,forward,0.4691531785127845,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA -MK114997.1,rev_exon1,5395,5476,5968,6046,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG -MK114997.1,vpu,5487,5733,6060,6309,forward,0.5568484042553192,MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM,MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM*,ATGCATGCCTTAAAAATAGCAGCAATAGTAGGATTAGTAGTAGCAACAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGAGACCAGGAGGAATTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG -MK114997.1,tat_exon2,7788,7881,8375,8471,forward,0.4918032786885247,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG -MK114997.1,rev_exon2,7789,8065,8376,8652,forward,0.40871934604904625,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG -MK114997.1,nef,8208,8850,8795,9416,forward,0.5432971135257649,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTGCCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTTCAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTTCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGTCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAATATTTCAAGGACTGCTGA -MK115518.1,gag,739,2239,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115518.1,pol,2031,5043,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115518.1,vif,4987,5566,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115518.1,vpr,5505,5796,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115518.1,tat_exon1,5776,5995,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115518.1,rev_exon1,5915,5996,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115518.1,vpu,6007,6253,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115518.1,env,6170,8711,6223,8794,forward,0.4583799776107468,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115518.1,tat_exon2,8292,8388,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115518.1,rev_exon2,8293,8569,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115518.1,nef,8712,9327,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK115065.1,gag,221,1730,789,2292,forward,0.2880084183556756,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATGGGAAAAAATTTACCTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGCGTACATCCAAGGATAAATGTAAAAGACACCAAAGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATGGTACATCAACCCTTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGCTGAGGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAGGGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGATATCTATAAAAGATGGATAATCCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGGGATTATGTAGACCGGTTCTATAAAACTCTAAGGGCTGAGCAAGCGTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAATCAGCCTCCATAATGGTGCAGGGAGGCAATTTTAGGAACCAAAGAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACACAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA -MK115065.1,pol,1522,4534,2084,5096,forward,0.25117173416656646,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCAGTCAACATAATTGGAAGAAATCTGTTGACCCAGCTTGGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATGGAAAAGGAAGGGAAAATTACAAAAATTGGGCCTGAGAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTGGGAAGTTCAACTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGGAGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGATTTAGAAATAGAGCAGCACAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGGGGTGGGGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTGGACTATCAATGACATACAGAAGTTAGTGGGAAAGTTGAATTGGGCAAGCCAAATCTATCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGGGGAGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCTATACAAAAGGAAACATGGGAAATGTGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAATTAGGAAAAGCAGGGTATGTTACGGACAGAGGAAGACAAAAGGTTGTCTCCCTAATGGACACAACAAATCAGAGGACTGAGTTACACGCTATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAGGGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAGGAAAAGATTTACCTGGCATGGGTCCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTAGTGGAATCAGAAAAGTACTATTTCTGGATGGAATAGATAAGGCCCAAGAAGAACATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115065.1,vif,4478,5057,5040,5619,forward,0.3903081914030819,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGGGGAAGCAAGATTGGTAATAAAAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAG -MK115065.1,vpr,4996,5287,5558,5849,forward,0.3351206434316354,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAACTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115065.1,tat_exon1,5267,5486,5829,6045,forward,0.48954161103693805,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA -MK115065.1,rev_exon1,5406,5487,5968,6046,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG -MK115065.1,vpu,5498,5744,6060,6309,forward,0.5568484042553192,MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM,MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM*,ATGCATGCCTTAGAAATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGGGACCAGGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG -MK115065.1,env,5661,8262,6223,8794,forward,0.5052314240113498,MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGAAAGTGACGGGGACCAGGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAACAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAAATCGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAGGTAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATGGAACAGACATAATAGGAGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAATAGTACTTGGAATGGTACTGACAATTGGAATGGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGGAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAATAGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAAGCAGTGGGAAAAGGAAATTGACAATTACACAGACATAATATATAACCTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -MK115065.1,tat_exon2,7843,7936,8375,8471,forward,0.4918032786885247,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG -MK115065.1,rev_exon2,7844,8120,8376,8652,forward,0.40871934604904625,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG -MK115065.1,nef,8263,8905,8795,9416,forward,0.5339772804571117,MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTACCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAGAACCTGCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA -MK115464.1,gag,527,2297,789,2292,forward,0.706855791962175,MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ,MLQAIPGLRVGPAGSHPFALTSLSASCCHQSQSPGCSGATARTGT*KRK*NQRSSLDAGLGLLKRARQEARGGDW*VRQF*LAEARRREISARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADKGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNA*VKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAE*DRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIA*MTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKN*MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ*,ATGCTTCAGGCCATCCCTGGTTTGAGGGTGGGTCCCGCCGGGTCCCACCCCTTTGCACTCACGAGCCTGTCTGCCTCCTGCTGCCATCAATCACAGAGCCCAGGCTGTTCGGGCGCCACTGCCCGAACAGGGACCTGAAAGCGAAAGTAGAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGAGGCGGCGACTGGTGAGTACGCCAATTTTGACTAGCAGAGGCTAGAAGGAGAGAGATAAGTGCGAGAGCGTCTGTATTAAGCGGGGGAGAATTAGATAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAGAAAAGATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCCGGCCTTTTAGAAACAACAGAAGGATGTAAACAAATACTGGAACAGCTGCAACCATCCCTTCCGACAGGATCAGAAGAACTTAGATCATTATTTAATACAGTAGCAACCCTCTATTGTGTGCATAAGAGAATAGAGGTACAAGACACCAAGGAAGCCTTAGAAAAGATAGAAGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAGGCAGTAGCTGACAAAGGAAGTACCAGCCAGGTCAGCCAAAATTACCCGATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGGCCATATCGCCTAGAACTTTAAATGCATAGGTGAAAGTAGTAGAAGAGAAGGCCTTTAGCCCAGAGGTAATACCCATGTTTTCAGCATTATCGGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAGGCTGCAGAATAAGATAGAGTGCATCCAGTGCATGCAGGGCCTGTTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATAGATGACAAGTAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTAGGATTAAATAAGATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAGTCCTAAGAGCCGAGCAAGCATCACAGGATGTAAAAAATTAGATGACAGAAACCTTATTAGTCCAAAATGCAAACCCAGATTGTAAGACTATTTTAAAAGCATTAAGACCAGCAGCAACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAAATATCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGACTGTTAAGTGTTTCAATTGTGGCAAAGAAAGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAAGGAAGATCTGGCCTTCCTCCAAAGGAAGGCCAAGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTAGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAAGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA -MK115464.1,pol,2089,5101,2084,5096,forward,0.7518376924488996,AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED,FFKEDLAFLQRKAKELSSEQTRANSPTRRELQV*GGDSNSSSEAGAGGQRSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEISLPGR*KPKMIEGIGGFIKVRQYDQITIEICGHKAIGTVLVGPTPVNIIGRNLLTQISCTLNFPISPIETVPVQLKPGIDSPKVKQWPLTEEKIKALVEICTEMEKEKKISKIRPENPYNTPVFAIKKKDSTK*RKLVDFKELNKRTQDF*EVQLRIPHPARLKKKKSITVLDVGDAYFSIPLDKDFKKYTAFTIPSINNKTPEIRYQYNVLPQG*KRSPAIFQSSMIKILEPFRKQNPDIVIYQYIDDLYVRSDLEIRQHRTKIEELRQHLLK*RLTTPDKKHQKEPPFLWISYELHPDKWTVQPIVLPDKDSWTVNDIQKLVRKLN*ASQIYAEIKVRQLCKLLKGAKALTEVIQLTEEAELELAENKEILKEPVHEVYYDPSKDLIAELQKQRQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVI*GKTPRFKLPIQKET*DT*WTEYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVGAETFYVDRAANKETKLRKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALRIIQAQPDKSESEIVNQIIEQLIKKEKVYLA*VPAHKRIRRNEQVDKLVSARIRKVLFLDRIDKAQEEHKKYHNN*RAMASDFNLPPVVAKKIVASCDKCQLKKEATHRQVDCSPRIWQLDCTHLEGKVILVAVHVASRYIEAEVIPAETGQETAYFLLKLAGR*PVKAIHTDNGTNFTSATVKAAC**AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED*,TTTTTTAAGGAAGATCTGGCCTTCCTCCAAAGGAAGGCCAAGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTAGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAAGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGAGGGCAGCTAAAGGAAGCTCTATTAGATACAGGAGCAGATGACACAGTATTAGAAGAAATAAGTTTGCCAGGAAGATAGAAACCAAAAATGATAGAAGGAATTGGAGGCTTTATCAAAGTAAGACAGTATGATCAGATAACTATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGCAGAAATTTGTTGACTCAGATTAGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTACAATTAAAACCAGGAATAGATAGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAAGAAAAAAAGATTTCAAAAATTAGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGAAGAAAATTAGTAGATTTCAAGGAACTTAATAAAAGAACTCAAGACTTCTAAGAAGTTCAATTAAGAATACCACACCCCGCAAGGTTAAAAAAGAAGAAATCAATAACAGTACTAGATGTAGGTGATGCATATTTTTCAATTCCCTTAGATAAAGACTTCAAGAAGTATACTGCATTTACCATACCTAGTATAAATAATAAGACACCAGAGATTAGATATCAGTACAATGTGCTTCCACAGGGATAGAAAAGATCACCAGCAATATTCCAAAGTAGCATGATAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGACATAGTTATCTATCAATACATAGATGACTTGTATGTAAGATCTGACTTAGAAATAAGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACACTTGTTGAAGTAGAGATTGACCACACCAGATAAAAAACATCAGAAAGAACCCCCATTCCTGTGGATAAGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGACAAAGATAGCTGGACTGTCAATGACATACAGAAGCTAGTAAGAAAATTGAATTGAGCAAGTCAGATTTATGCAGAGATTAAAGTGAGACAATTATGTAAACTCCTTAAAGGAGCCAAAGCGCTAACAGAAGTGATACAACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAAAGAAATTCTAAAAGAACCAGTACATGAAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAGTTACAGAAGCAGAGGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAACGAGAGGTACCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTGATATGAGGAAAGACCCCTAGATTTAAACTACCCATACAGAAAGAAACATAAGATACCTAGTGGACAGAATATTGGCAAGCCACCTAGATTCCCGAGTAAGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATAGTACCAATTAGAAAAAGAGCCTATTGTAGGAGCAGAAACTTTCTATGTAGATAGGGCAGCTAATAAAGAGACTAAATTAAGAAAAGCAGGATATGTTACTAGCAGAGGAAGACAAAAGGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAACTGCAAGCAATTTGTCTAGCATTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCACTAAGAATAATTCAAGCACAACCAGATAAGAGTGAATCAGAGATAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTACCTTGCATAGGTACCAGCACACAAAAGAATTAGAAGAAATGAACAAGTAGATAAATTAGTCAGTGCTAGAATCAGGAAAGTCCTATTTTTAGATAGAATAGATAAGGCCCAAGAAGAGCATAAGAAATATCACAATAATTAAAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAAAAATAGTAGCCAGTTGTGATAAATGCCAGCTAAAAAAAGAAGCCACGCATAGACAAGTAGACTGTAGTCCAAGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAGTTATCCTAGTAGCAGTTCATGTAGCCAGTAGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTCCTCTTAAAATTAGCAGGAAGGTAGCCAGTGAAAGCAATACATACAGACAATGGAACCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTAGTAGGCAAAGATCAAGCAGGAATGTGGCATTCCCTACAATCCCCAAAGTCAAGAAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAAGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTCCAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAACAGAGATCCACTTTGGAAAGGACCAGCAAAACTTCTTTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAAGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115464.1,vif,5045,5624,5040,5619,forward,0.7067546928117459,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY*GLHTGERDWHLGQGVSIEWKERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRRSQTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGCACATGGAAAAGTTTAGTAAAACACCATATGTACATTTCAAAGAAAGCCCAAGGATGGTTTTATAGACATCACTATGAAAATCCTCATCCAAGAATAAGTTCAGAAGTACACATCCCGCTAGGGGATGCTAGATTGGTAATAACAACATATTAGGGTCTGCATACAGGAGAAAGAGACTGGCATTTAGGTCAAGGAGTCTCCATAGAATGGAAGGAAAGGAAATATAGCACACAAGTAACCCCTGACCTAGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTGCAGAATCTGCTATAAGAGAGGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAACAGCATTAGTAACACCAAAAAAGACAAAGCCACCTTTGCCTAGTGTGACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAG -MK115464.1,vpr,5563,5854,5558,5849,forward,0.37688442211055273,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTAGGACAACATATCTATGAAACTTATGAGGATACTTGGACAGGAGTAGGAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTAGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAG -MK115464.1,tat_exon1,5563,6052,5829,6045,forward,0.7571801566579635,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS*IRALEASRKSA*DSLYQMLL*KMLLSLPSLFHNKRLRHLLWQEEAETATKTSSRQSDSSSTSTKAV,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTAGGACAACATATCTATGAAACTTATGAGGATACTTGGACAGGAGTAGGAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTAGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAAATGCTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTG -MK115464.1,rev_exon1,5973,6054,5968,6046,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKYLYQSSE,MAGRSGDSDEDLLKTVRLIKYLYQSSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGAG -MK115464.1,vpu,6065,6311,6060,6309,forward,0.7521692502681095,MQSLYILTIVALVVAAILAIVV,MQSLYILTIVALVVAAILAIVV*AIVLIEYKKILKQRRIDRLIDRIIDKAEDSGNESEGDQEELSAFVEIGHHAP*NVDDL*,ATGCAATCTTTATATATATTAACAATAGTAGCATTAGTAGTAGCAGCAATATTAGCAATAGTTGTGTAGGCCATAGTACTCATAGAATATAAGAAAATATTAAAACAAAGGAGAATAGATAGGTTAATTGATAGAATAATAGATAAGGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAGGGCATCATGCTCCTTAGAATGTTGATGATCTATAG -MK115464.1,env,6228,8799,6223,8794,forward,0.7471048806788873,MTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST,MRVKEIKRSYQHL*R*GIMLLRMLMIYSTADQWWVTVYYKVPVWREANTTLFCASDAKAYSTEAHNV*ATHACVPTDPNPQEIVIENVTEDFNMWKNNMVDQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTSNTT*GEMTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST*TKNGTDSWQSNDTQNSNITLQCRIKQIINLWQEVRKAMYAPPISRQINCTSNITGLVLTRDRRNETKTFRPGRENMKDNWRSKLYKYKVVRIEPLRIAPTKAKRRVVQREKRAVRLGAMFLKFLGAARSTIGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLAVERYLQDQQLLGL*GCSRKLICTTTVP*NRS*GRHNKNYKSLDDI*DNMT*IE*EKEIDNYTSLIYTLITESHSQQKKNEQELLALDK*ASL*N*FDISQWLWYIKIFIMIVGGLVSLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPERIEERGRERDKGRSGRLVNGFLALI*DDLRSLCLFSYHRLSDLLLIVIKIVELLRRKR*EALKY**NLLQY*SQELKNSAVSLLNTTAIVVAERTDKIIEILQRISRAFLHIPRRIRQGLEKALL*,ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAGGGCATCATGCTCCTTAGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATAAGGTACCTGTGTGGAGAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGCACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTAATAGAAAATGTAACAGAAGATTTTAACATGTGGAAGAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATAGGATCAAAGTCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGTACTGATATTAGGAATAGTACCGTTACTTCTAATACTACTTCTAATACTACTTAGGGAGAAATGACAAACTGCACTTTCAATATCACCACAAGCATAAAGGATAAGATAAAAAAAGAAGCGGCACTTTTTTATAAAATTGATTTAGTAGAAATAGATGAAAAGAAAAATAACAGTAGTACCAGATATAGGTTGATAAATTGTAACACCTCAGCCATTACACAAGCCTGCCCAAAGGTATCCTTTAAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCAATTCTAAAGTGTAATAATAAGAAGTTCAGTGGAAAAGGACCATGTACAAATGTCAGCACAGTGCAATGTACACATAGAATTAAGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAATGATTAGATCTGACAATATCACAGACAATACTAAAAACATAATAGTACAGTTGAAAGAAGCCATACGAATTTTCTGTATAAGACCCAACAACAATACAAGAAAAAGTATAAATATAAGACCAGGAAGAGCATTTTATACAACAGGAGATATAATAAGAGACATAAGGCAAGCACATTGTAACATTAGTGGAAATTGGAGTAACACTTTAAAACAGATAGCTACACAATTAGGAAAACAACTGAATCAAACACAACAAATAATCTTTAATTCATCCGCAGGAAAGGACCCAGAGATTGTAACACACAGTTTTAATTGTGGAAAGAAATTCTTCTATTGTAATTCATCATCACTGTTTAATAGTACCTAGACTAAAAATGGTACTGATAGTTGGCAGTCTAATGATACTCAGAATAGTAATATCACACTCCAATGCAGAATAAAACAAATTATAAACCTGTGGCAGGAAGTAAGAAAAGCAATGTATGCCCCTCCCATCAGTAGACAAATTAACTGTACATCAAATATTACAGGGCTAGTTTTAACAAGAGATAGGAGGAATGAAACTAAGACCTTTAGACCTGGAAGAGAAAATATGAAGGATAATTGGAGAAGTAAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAAGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAGAGAGAGAAAAGAGCAGTAAGACTAGGAGCTATGTTCCTTAAGTTCTTAGGAGCAGCCAGAAGCACTATAGGCGCAGCGTCGATAGCGCTGACGGAACAGGCCAGACGAGTCTTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATTTGTTGCAACTCACAGTCTAAGGCATTAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTACAGGATCAACAGCTCCTAGGACTTTGAGGTTGCTCTAGAAAACTCATTTGCACCACTACTGTGCCTTAGAATCGTAGTTGAGGTAGGCATAACAAAAATTACAAAAGTCTAGATGACATTTAGGATAACATGACCTAGATAGAGTAGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTACAGAATCACATTCCCAACAAAAAAAGAATGAACAAGAATTATTGGCATTAGATAAATAGGCAAGTTTGTAGAATTAGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAAGGACAGATAAGATAATAGAAATATTACAAAGAATTAGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAA -MK115464.1,nef,8194,9451,8795,9416,forward,0.6514772974147296,MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC,MNKNYWH*INRQVCRISLTYHNGCGI*KYS****EA**V*E*FLLYFL**IKLGKDTHHYHFRPSSQPREEPTGPKE*KKEVERETKADPVD**TDS*HLSRTIYGAYASSATTA*ATYS*L*SRLWNF*DARGKKPSNISRISCSTRVRN*RIVLSACSTPQL***LKGQIR**KYYKELVELFSTYLGE*DRA*KRLCYKIGGKWSKSSKVK*NAVKERIRRAQPTADKERAEPAADKVRAASRDLEKYGALTSKNTAATNADCAWLEAQEEEDEVGFPVRPQLPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*,ATGAACAAGAATTATTGGCATTAGATAAATAGGCAAGTTTGTAGAATTAGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAAGGACAGATAAGATAATAGAAATATTACAAAGAATTAGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAAGATAGGTGGCAAGTGGTCAAAAAGTAGTAAGGTTAAATAGAATGCAGTGAAAGAAAGAATAAGACGAGCTCAGCCAACAGCAGATAAAGAACGAGCTGAGCCAGCAGCAGATAAGGTAAGAGCAGCATCTAGAGACCTAGAAAAATATGGAGCACTTACAAGTAAGAATACAGCAGCTACTAATGCTGATTGTGCCTGGCTAGAAGCACAAGAAGAGGAGGATGAGGTAGGTTTTCCAGTCAGACCTCAGTTACCTTTAAGACCCATGACTTATAAAGCAGCTCTAGATCTGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAGTTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTATTTCCCTGATTGGCAGAACTACACACCAGGGCCAAGGATCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCACTTGAGCCAGATCAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCCTGTTACACCCTCTGAGCCAGCATAGGATGGATGACCCGGAGAAAGAAGTGCTAGTGTGGAGATTTGACAGCCGCCTCGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAAGACTGCTGA -MK115464.1,tat_exon2,8380,8476,8375,8471,forward,0.6995153473344102,RPSSQPREEPTGPKE,RPSSQPREEPTGPKE*KKEVERETKADPVD**,AGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGA -MK115464.1,rev_exon2,8381,8657,8376,8652,forward,0.5716671727907683,RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE,DPPPSPERSRQARKNRRKR*RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE*,GACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAG -MK115530.1,gag,746,2246,789,2292,forward,0.3014827756125966,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115530.1,pol,2038,5050,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115530.1,vif,4994,5573,5040,5619,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115530.1,vpr,5512,5803,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115530.1,tat_exon1,5783,6002,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115530.1,rev_exon1,5922,6003,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115530.1,vpu,6014,6260,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115530.1,env,6177,8718,6223,8794,forward,0.46021436825118545,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115530.1,tat_exon2,8299,8395,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115530.1,rev_exon2,8300,8576,8376,8652,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115530.1,nef,8719,9334,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK115520.1,gag,695,2195,789,2292,forward,0.3014827756125966,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115520.1,pol,1986,5004,2084,5096,forward,0.6033592883813991,YGKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,IF*GKSGLPTKEGQGTSFRADQSQQPHQKRASGLGKRQ*LPLRSRSQETRNCIPCLPSNHSLAATPRQNKNRGAI*RSFLRYRSR*YSIRRNEFARKMETKNDRGNWRFYQSKTV*SDTHRNLWTQSYRYSINRTYTCQHNWKKSVDSAWLYLKFSH*SY*NCTSKIKARNGWPKS*TMAIDRRKNKSISRNLYRNGKGRKNFKNWA*KSIQYSSICYKEKRQY*MEKISRFQRTQ*ENSRLLGSSIRNTTSCRVKKEKISNSTGCG*CIFFNSLR*RIQEVYCIYHT*YK**DTRD*V*VQCAATGMERITSNIPK*HDKNLRAF*KAKSRYSYLSIHG*FVCRI*LRNRAA*NKNRGTKTTSVKVGTYHTRQKTSERTSIPLDGL*TPS*YGKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,ATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAAATAGGGGGGCAATTTAAAGAAGCTTTCTTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTAAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATATGGGAAATGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115520.1,vif,4948,5527,5040,5619,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115520.1,vpr,5466,5757,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115520.1,tat_exon1,5737,5956,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115520.1,rev_exon1,5876,5957,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115520.1,vpu,5968,6214,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115520.1,env,6131,8672,6223,8794,forward,0.4585964351370794,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAGATAAGATGCAGAAAGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAAATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGGATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTTAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115520.1,tat_exon2,8253,8349,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115520.1,rev_exon2,8254,8530,8376,8652,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115520.1,nef,8673,9288,8795,9416,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAATGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGATACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTGCACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK115503.1,gag,817,2317,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115503.1,pol,2109,5121,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115503.1,vif,5065,5644,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115503.1,vpr,5583,5874,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115503.1,tat_exon1,5854,6073,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115503.1,rev_exon1,5993,6074,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115503.1,vpu,6085,6331,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115503.1,env,6248,8789,6223,8794,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115503.1,tat_exon2,8370,8466,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115503.1,rev_exon2,8371,8647,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115503.1,nef,8790,9405,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK115570.1,gag,687,2187,789,2292,forward,0.2967573174581697,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCGACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115570.1,pol,1979,4991,2084,5096,forward,0.19298018391400085,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115570.1,vif,4935,5514,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115570.1,vpr,5453,5744,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115570.1,tat_exon1,5724,5943,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115570.1,rev_exon1,5863,5944,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115570.1,vpu,5955,6201,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115570.1,env,6118,8659,6223,8794,forward,0.4620723847297967,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCTCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAAGGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115570.1,tat_exon2,8240,8336,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115570.1,rev_exon2,8241,8517,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115570.1,nef,8660,9275,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK115509.1,gag,555,2055,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115509.1,pol,1847,4859,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115509.1,vif,4803,5382,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115509.1,vpr,5321,5612,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115509.1,tat_exon1,5592,5811,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115509.1,rev_exon1,5731,5812,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115509.1,vpu,5823,6069,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115509.1,env,5986,8527,6223,8794,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115509.1,tat_exon2,8108,8204,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115509.1,rev_exon2,8109,8385,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115509.1,nef,8528,9143,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK115702.1,gag,246,1782,789,2292,forward,0.35613851839948674,MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ,MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ*SQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGCGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAGGAAACGATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGCTTCGCAGTCAACCCTGGCCTGTTAGAAACATCAGAAGGCTGCAAACAAATAATGGGACAACTCCAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGTGTACATCAGAGGATAGATGTAAAGGATACCAAAGAAGCTTTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGACACAGCAAGCAGCAGCCGCTGACACAGGAAACAACAGCCAAGTCAGCCAAAATTACCCCATAGTGCAGAACATGCAGGGACAAATGGTACATCAGGCCATATCACCCAGAACCCTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCATTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAGGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAGGCTGCAGAATGGGATAGAGTGCATCCAGTGCAGGCAGGACCTGTTGCACCAGGCCAGATAAGGGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACACATAATCCACCCGTCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGACTAAATAAAATAGTAAGGATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAGACTCTAAGAGCTGAGCAAGCTTCACAGGAAGTAAAAGGTTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACCATTTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCAGCCATAAGGCAAGGGTTTTGGCAGAAGCAATGAGCCAAGCAACAGGTGCACATGCCATAATGATGCAGAGAGGCAATTTTAAGAACCAAAGAAAGACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGACTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCCTCAGGCCAACAGCCCCACCAGTAGAGAGCTTCAGGTTTGGGGAAGAGACAGCAGCCCCCTTTCAGAAGCAGGAACCGAGAGACAAGGAGATGTCTCCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCAGTAGTCACAATAA -MK115702.1,pol,1544,4586,2084,5096,forward,0.24526399193257942,FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCCTCAGGCCAACAGCCCCACCAGTAGAGAGCTTCAGGTTTGGGGAAGAGACAGCAGCCCCCTTTCAGAAGCAGGAACCGAGAGACAAGGAGATGTCTCCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCAGTAGTCACAATAAAGATAGGGGGGCAAATAAAGGAAGCTCTATTAGACACAGGAGCAGATGATACAGTATTAGAAGAAATGGCGTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATAGCCATAGAAATTTGTGGACATAAAGCAATTGGTACAGTATTAGTAGGACCTACACCTGTCAATATAATTGGAAGAAATCTATTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAGTTAAAGCCAGGAATGGATGGCCCAAAAATTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATAGGGCCTGAAAATCCATACAATACTCCAATATTTGCCATAAAGAAAAAAGACAGTACTAAGTGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGATTAAAAAAGAAAAAATCAATAACAGTACTGGATGTGGGTGATGCCTATTTTTCAGTTCCCTTAGATGAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGCATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATATTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGACGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTAAGAGGACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAGGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAGATGGACAGTACAGCCTATAAAGCTGCCAGAGAAAGAAATCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAACTGGGCAAGTCAGATTTACCCAGGAATTAAAGTAAAACAATTATGTAAACTCCTTAGGGGAACCAAAGCATTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGAATTAATAGCAGAAATACAGAAGCAAGGGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCGAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAGAAAATATCTACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAGGAAACATGGGAAATATGGTGGACAGACTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTTAGTACTCCTCCCCTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCATCTAATAGGGAGACTAAATTAGGAAAAGCAGGATATATTACTGACAGAGGAAGACAAAAGGTTGTCACCCTAAATGACACAACCAATCAAAAGACAGAGTTACAAGCAATTCTTCTAGCATTGCAGGATTCAGGATTAGAAGCAAACATAGTGACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGATCTACCTGACATGGGTACCAGCACATAAAGGAATTGGAGGAAATGAGCAAGTAGATAAATTAGTCAGTACTGGGATTAGGAAAGTATTATTTTTAGATGGAATAGATAGGGCCCAAGAAGAGCATGAGAGATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTCAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGACAAATAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACACTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTACCACAGTTAAGGCCGCCTGTTGGTGGGCGGGGGTCAAGCAGGAATTTGGTATTCCCTACAATCCCCAGAGTCAAGGAGTGGTAGAATCTATGAATAAAGAATTAAAGAAAATAATAGGACAGGTCAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTTCAAAAATTCAAAACTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCGGTAGTAATACAGGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115702.1,vif,4530,5109,5040,5619,forward,0.3566796368352788,MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGTATGTTTCAAAGAAAACTAAGGGATGGTTTTATAGACATCACTATGAGAGCACTCATCCAAAAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTGAGTTGGTAGTAACAACATATTGGGGTTTGCAGCCAGGGGAAAGGGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAGGGAGATATAGAACACACGTGGACCCTAACCTAGCAGACCAACTAATTCATCTGCATTACTTTGATTGTTTTTCAGAATCTGCTATAAGACATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAAGAGCACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACTAAACTAACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG -MK115702.1,vpr,5048,5339,5558,5849,forward,0.3566796368352788,MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS,MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAACTTAAGCAGGAAGCTGTTAGGCATTTTCCTAGGCCATGGCTTCATAGCTTAGGGCAATATATCTATGAAACTTATGGGGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATGCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATCCCACAGAGGAGAGCAAGAAATGGATCCAGTAGATCCTAA -MK115702.1,tat_exon1,5319,5538,5829,6045,forward,0.5237430167597767,MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ,MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ*,ATGGATCCAGTAGATCCTAACCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTAACAATTGCTATTGTAAAAAGTGTTGCCTTCATTGCCAAGTTTGTTTCACACGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAGTAA -MK115702.1,rev_exon1,5458,5539,5968,6046,forward,0.5622384937238494,MAGRSGDGDEDLLKAVRLIKTLYQSSK,MAGRSGDGDEDLLKAVRLIKTLYQSSK,ATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAGTAAG -MK115702.1,vpu,5550,5808,6060,6309,forward,0.6039004707464695,MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND,MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND**,ATGTTATCTTTAGAAGTAATAGTAGCAATAACAGCATTAGTAGTAGCAGGAATAATAGCAATAGTTGTGTGGACCATAGTACTTATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAAGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAGGGGGATCAGGAAGAATTGTCAGCGCTTGTGGAGATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAA -MK115702.1,env,5716,8257,6223,8794,forward,0.5196110433453024,MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE,MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE*DRA*,ATGAGAGTGAGGGGGATCAGGAAGAATTGTCAGCGCTTGTGGAGATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAATGCTACAGAACAATTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACAACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATGGTATTAATAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGATCAAATGCAAGAGGACATAGTCAGCTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACCTTAAATTGCACTAATTTGACCATTGAGCCAAACAATGCTACTAAAGCCAATATTAGTGGGAGGTTAGAGGGGAAAGGAGAAATGACAAACTGCTCTTTCAATGTCACCACAAGCCTAAGAGATAAGAGGAAGAAAGAATATGCACTCTTTTATAAACTTGATGTAGTAGCAACAGGTGAAAATAATAACAGCTTTAGGTTGATAAGTTGTAATACCTCAGAGATTACACAGGCCTGTCCAAAGGTATCATTTGAACCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATGATAAAAAGTTCAATGGAACAGGAAAATGTAACAATGTCAGCATAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAGTAGTTAGATCTGCCAATTTCTCAGACAATACTAAGACCATAATAGTACAGCTGAACAAAACTGTAGTAATTAATTGTACAAGACCCAACAACAATACAAGGAGAAGTATACATATAGCACCAGGGAGAGCATTTTATGCAACAGGAGATATAATAGGAGATATAAGAAAAGCACATTGTAACATTAGTAAAGAAGATTGGAATACCACTTTAAACCAGGTGGCTAAAAAATTACAAGAACAATTTGAGAATGCAACAATAGACTTTAAACCATCCTCAGGAGGGGACCCAGAAATTGTAATGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACGGAACTATTTTCTTGGAATGCTACAACAAAACTGTTTACTTGGAATGCTACAAATAGCAATAATGGAACCATCATACTCCCATGTAGAATAAAACAAATTATAAACATGTGGCAAGAGGTAGGAAAAGCAATGTATGCCCCTCCCATTCGTGGACAAATTAGATGTTCGTCAAATATTACAGGACTGCTATTAACAAGAGATGGTGGGACTAACGGGACAGGGAACAGGAATGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAGAAATTAAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGACCATAGGAGCTATGTTCCTTGGGTTCCTGGGGGCAGCAGGAAGCACTATGGGCGCAGCATCACTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCGATTGAGGCGCAGCAGCATCTGTTGCAACTCACAGTCTGGGGCATAAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGGTACCTAAGAGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAATATTAGTTGGAGTAATAGAACTCTGAATAACATTTGGGACAATTTGACTTGGATGCAGTGGGATACAGAAATTAACAATTACACAAACAAAATATACCAATTACTTGAGGAAGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAATTTGTGGAATTGGTTTGACATATCAAACTGGCTGTGGTACATAAAAATATTCATATTAATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGAACGGATTCTTGACACTTATCTGGGTCGATCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTCAAATATTGGTGGAATGTCCTGCAATATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTAAATGCCACAGCCATAGTAGTAGCTGAGGGGACAGATAGGATTATAGAATTAGCACAAAGAATTTGTAGAGCAGAATAAGACAGGGCTTGA -MK115702.1,tat_exon2,7874,7970,8375,8471,forward,0.32608695652173914,RPASQSRGDPTGPKEPKKKVERETETDPTD,RPASQSRGDPTGPKEPKKKVERETETDPTD**,AGACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGA -MK115702.1,rev_exon2,7875,8151,8376,8652,forward,0.3471418653089562,DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE*,GACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGAACGGATTCTTGACACTTATCTGGGTCGATCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTCAAATATTGGTGGAATGTCCTGCAATATTGGAGTCAGGAACTAAAGAATAG -MK115702.1,nef,8275,8896,8795,9416,forward,0.4680383864671438,MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC,MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC*,ATGGGTGGCAAGTGGTCAAAACATAGTAAGAGTGAATGGGCTGATGTAAGGGAAAGAATGGCACAAACTGAGGCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGATCTGGAAAGACATGGAGCAATCACAAGTAGCAATACAGCAACTAACAATGCTGCTTGTGCTTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCAAACCTCAGGTGCCTTTGAGACCAATGACCTACAAGGGAGCTTTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTATTCCCAAAAAAGACAAGACATCCTTGATCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGAACCAGATTCCCACTGTGCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTGGAAGAAGCCAATAAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACACCGAGAGAGAGGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACGTAGCCAGAGAGAAACATCCGGAGTACTTCAAGGACTGCTGA -MK115095.1,gag,2,1697,789,2292,forward,0.7478034493979825,MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC,SGFSFTFKSLFGRHLGDLKAKEKPEELSRRRTRLAERARQEARRGD**VRRNF*LAEARRREIGARASVLSGGELDR*EKIYLRPGRKKKYRLKHIVWASRELERFAVNPGLLKSSEGCRQILGQLQPALQTGSEELRSLYNTIAVLYCVHQKINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQIVHQPISPRTLNA*VKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVRRHQAAMQMLKETINDEAAE*DRLHPVHAGPIAPGQMKEPRRSDIAGTTSTLQEQIR*MTNNPPIPVGEIYKR*IILRLNKIVKMYSPVSILDIRQRPKEPFKDYVDRFYKTLKAEQASQDVKN*MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC*KCGKKGHQMKDCTKRQANFLRKIWPSHKGRPKNFLQSRPEPTAPPAESFRFKEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*,TCTGGTTTCTCTTTCACTTTCAAGTCCCTGTTCGGGCGCCATCTAGGGGACCTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCACGGCAAGAGGCGAGGCGCGGCGACTAGTGAGTACGCCGAAATTTTTGACTAGCAGAGGCTAGAAGGAGAGAGATAGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATAGGAAAAAATTTACCTAAGGCCAGGGAGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAAAGTCATCAGAAGGCTGCAGGCAAATTCTAGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAGATAAATGTAAAAGACACCAAAGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAAGGGCAAATAGTACATCAACCCATATCACCTAGAACTTTAAATGCATAGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGAGAAGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAAGCTGCAGAATAAGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAAGGAACCAAGAAGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAAGATAGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATAGATAATCCTGAGGTTAAATAAAATAGTAAAAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAAGACCAAAGGAACCCTTTAAGGATTATGTAGACCGGTTCTATAAAACTCTAAAGGCTGAACAAGCGTCACAGGATGTAAAAAATTAGATGACAGAAACCTTGTTAGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAAGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGAGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAGTCAGCCTCCATAATGGTGCAAGGAGGCAATTTAAAGAACCAAAGAAAGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACACAGCCAAAAATTGCAGGGCCCCTAAGAAAAAAGGCTGTTAGAAATGTGGAAAGAAAGGACACCAAATGAAAGATTGTACTAAGAGACAGGCTAATTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAAAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTAAGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA -MK115095.1,pol,1489,4501,2084,5096,forward,0.7624366800883231,KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK,FFKEDLAFPQGKAKEFSPEQTRANSPASRELQV*GRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIRRQLKEALLDTGADDTVLKEINLPGK*KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK*RKLVDFRELNKRTQDF*KVQLRIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPRVRYQYNVLPQR*KGSPAIFQSSMTKILEPFRKENPDIVIYQYIDDLYVRSDLEIEQHRTKIEELRQHLLK*RLTTPDKKHQKEPPFL*ISYELHPNKWTVQPIQLPDKDS*TVNDIQKLVRKLN*ASQIYPEIKVKQLCKLLRRTKALTEVVPLTEEAELELAENKEILKEPVHRAYYDPSKDLIAEVQKQGGDQWTYQIYQKPFKNLKTKKYARTRGAHTNDVKQLTEAVQKIALEAIVI*RKTPKFKLPIQKET*EM**TEYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVRAETFYVDRAANRETKLRKARYVTDRRRQKVVSLIDTTNQRTKLHAIHLALQDSGSTVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKEKIYLA*VPAHKRIRRNEQVDKLVSSRIRKVLFLDRIDKAQEEHEKYHSN*RAMASDFNLPPVVAKEIVASCDKCQLKREPMHGQVDCSPGIWQLDCTHLERKIILVAVHVASRYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAAC**ARIKQKFSIPYNPQSQGVVESMNNELKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKRGIGGYSAEERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLL*KGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAAAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTAAGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAAGAAGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAAAAGAAATAAATTTGCCAGGAAAATAGAAACCAAAAATAATAGAAGGAATTAGAGGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAAAAATTTGTAGACATAAAGCTATAAGTACAGTATTAATAAGACCTACACCAGTCAACATAATTAGAAGAAATCTGTTGACCCAGCTTAGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATAGATAGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATAGAAAAAGAAAGGAAAATTACAAAAATTAGGCCTAAGAATCCATATAATACTCCAGTGTTTGCCATAAAGAAAAAAGACAGTACTAAATAGAGAAAATTAGTAGATTTCCGAGAACTTAATAAAAGAACACAAGACTTTTAAAAAGTTCAACTAAGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTAGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAAGAGTTAGATATCAGTACAATGTGCTTCCACAAAGATAGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAAGAAAATCCAGACATAGTTATCTATCAATACATAGATGATTTGTATGTAAGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAAGAACTGAGACAACATCTGTTAAAGTAAAGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTAGATAAGTTATGAACTCCATCCTAATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTAGACTGTCAATGACATACAGAAGTTAGTAAGAAAGTTAAATTAGGCAAGCCAGATCTATCCAGAGATTAAAGTAAAGCAATTATGTAAACTCCTTAGAAGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAAGGAGATTCTAAAAGAACCAGTACATAGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGAGGAGACCAATGGACATATCAAATTTATCAGAAGCCATTTAAAAATCTGAAAACAAAGAAATATGCAAGAACGAGAGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATAGAGAAAGACTCCTAAATTTAAACTACCTATACAAAAAGAAACATAAGAAATGTAGTAGACAGAGTATTGGCAAGCCACCTAGATTCCTGAGTAGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATAGTACCAGTTAGAGAAAGAACCCATAGTAAGAGCAGAAACTTTCTATGTAGATAGGGCAGCTAATAGAGAGACTAAATTAAGAAAAGCAAGGTATGTTACGGACAGAAGAAGACAAAAAGTTGTCTCCCTAATAGACACAACAAATCAGAGGACTAAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAAAGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAAGAAAAAATTTACCTGGCATAAGTCCCAGCACACAAAAGAATTAGAAGAAATGAACAAGTAGATAAATTAGTCAGTAGTAGAATCAGAAAAGTACTATTTCTAGATAGAATAGATAAAGCCCAAGAAGAACATGAAAAATATCACAGTAATTAAAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAAGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAAGAAAAATTATCCTAGTAGCAGTTCATGTAGCCAGTAGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACAGTTAAGGCCGCCTGTTAGTAGGCAAGGATCAAGCAGAAATTTAGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAAAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAAGGGGGATTGGGGGGTACAGTGCAGAGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCAGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTAGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAAGATGAGGATTAG -MK115095.1,vif,4445,5024,5040,5619,forward,0.7494633160752622,MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR,MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR*VYRHHHESHNPKTSSEVHIPLREARLVIKTY*GLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVRPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKRSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAAGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGAGTTTACAGACATCACCATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAAGGGAAGCAAGATTAGTAATAAAAACATATTAAGGTCTGCATACAGGAGAAAGAGACTGGCATTTAGGCCAGGGAGTATCCATAGAATGGAGGAAAAAGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGGCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATGAATGGACATTAG -MK115095.1,vpr,4963,5254,5558,5849,forward,0.4464285714285715,MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS,MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS*,ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAACTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAAGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAA -MK115095.1,tat_exon1,5111,5453,5829,6045,forward,0.6409453748630458,MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ,MEILGQR*KP**EPCNNCCSFISELGVNIAG*ELFDRGEQEIEPVDPNLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGATACTTGGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAAGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAACTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCCATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA -MK115095.1,rev_exon1,5373,5454,5968,6046,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG -MK115095.1,vpu,5465,5711,6060,6309,forward,0.7521692502681095,MHALEIAAIVRLVVAAIIAIVV,MHALEIAAIVRLVVAAIIAIVV*SIVLIEYKKILRQKKIDRLIDRIRERAEDSGNESDEDQEELSAIVEIGHLVP*DSDDM*,ATGCATGCCTTAGAAATAGCAGCAATAGTAAGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGTCTATAGTATTAATAGAATATAAGAAAATTTTAAGACAAAAGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGAGGACCAGGAAGAATTATCAGCAATTGTAGAGATAGGGCATCTTGTTCCTTAGGATAGTGATGATATGTAG -MK115095.1,env,5628,8229,6223,8794,forward,0.7513561129398668,MTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD,MKVTRTRKNYQQL*R*GILFLRIVMICSANNL*VTVYYEVPVWKEATTTLFCASDAKAYKTEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDELNLNCPNNNTCSNNTKYNMTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD*NDTLKQIVIKLKEKFKNKTIVFNQSSGKDPEIVMHSFNCREEFFYCNTTQLFNST*NNNT*NGTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQGQIRCSSNITGLLLVRDSKSNNSSNDTKTFRPRRGDMKDN*RSELYKYKVVKIEPLRIAPTHAKRRVVQKEKRAIGLRAFFLKFLGAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLALERYLKDQQLLKI*GCSRKLICTTNVP*NVS*SPR*NRSLDKI*TNMT*KQ*EKEIDNYTDTIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQWL*YIKIFIMIVRGLISLRIVFTILSIVNRVRQRYSPLSLQTLLPTQRGPDRPERTEEGGREKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLRDLLLIVARIVELLRRRK*EALKYW*NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL*,ATGAAAGTGACGAGGACCAGGAAGAATTATCAGCAATTGTAGAGATAGGGCATCTTGTTCCTTAGGATAGTGATGATATGTAGTGCCAACAACTTGTAGGTCACAGTCTATTATGAGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTAGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATAAGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATGAATTAAATCTAAATTGCCCTAACAATAATACTTGTAGTAATAATACTAAATATAATATGACGGAAGAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAAGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAAGTAGTGGAAATACTACAGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATAGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATAGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAAGGAGGGCATTTTATAGAACAGACATAATAGGAGATATAAGACAAGCGCATTGTAACATTAGTAGGAAAGATTAGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTAAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAAAGGACCCAGAGATAGTGATGCATAGTTTTAATTGTAGAGAAGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTAGAATAATAATACTTAGAATGGTACTGATAATTAGAATAGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAAGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATAGTAAGAGCAACAATAGTAGTAATGATACAAAGACCTTCAGGCCTAGAAGAGGAGATATGAAGGACAATTAGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAAGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAGAAAGAAAAAAGAGCAATAGGACTTAGAGCTTTCTTCCTTAAGTTCTTAGGAGCAGCAGGAAGCACTATAGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTAAGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTAGAAAGATACCTAAAAGATCAACAGCTCCTGAAGATTTGAGGTTGCTCTAGAAAACTCATTTGCACCACTAATGTGCCCTAAAATGTTAGTTAGAGCCCTAGATAGAATAGATCTCTAGATAAGATTTAGACTAACATGACCTAGAAGCAGTAGGAAAAAGAAATTGACAATTATACAGACACAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTAGCATTAGATAAGTAGGCAAGTTTGTAGAATTAGTTTGACATTACACAGTGGCTATAGTATATAAAAATATTCATAATGATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGAGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAAAGGACAGATAAGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAAGCTTTGCTATAA -MK115095.1,nef,7624,8872,8795,9416,forward,0.5833488893037148,MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MNKTY*H*ISRQVCRISLTLHSGYSI*KYS****EA**V*E*FLLYCL**IELGRDTHHCHCRPSSQPRGDPTGPKEQKKEVERKTEAHPRD*CIDS*HSSRTTCGACSSSVTTA*ETYS*LWRGL*NF*DAESKKH*SIGRISCSIRVRK*RIVQLACSTPQQ*Q*LKGQIRL*KYYKEALELFSTYLHE*DRA*KKLCYKIGNKLSRRLRARWPAIKERMRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*,ATGAACAAGACTTATTAGCATTAGATAAGTAGGCAAGTTTGTAGAATTAGTTTGACATTACACAGTGGCTATAGTATATAAAAATATTCATAATGATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGAGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAAAGGACAGATAAGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAAGCTTTGCTATAAGATAGGTAACAAGTTGTCAAGAAGGCTCAGGGCTAGATGGCCTGCCATAAAAGAAAGAATGAGACAAGCTAGGCCAGTAAGAAAGCCAGAGCCAGCAGCAACTAAGGTAAGAGCAGCATCTCGAGACCTAGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTAGAAGCACAACAGGAAGAAAAAGAGGTAGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAAGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAAGGCCAGGAGTCAGATTTCCACTGTGTTTTAGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATAGAATAGAAGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA -MK115095.1,tat_exon2,7810,7903,8375,8471,forward,0.5303030303030303,RPSSQPRGDPTGPKEQKKEVERKTEAHPRD,RPSSQPRGDPTGPKEQKKEVERKTEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAG -MK115095.1,rev_exon2,7811,8087,8376,8652,forward,0.6667847862036381,ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE,DPPPNPEGTRQARKNRRRR*RERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAG -MK115490.1,gag,549,2049,789,2292,forward,0.3014827756125966,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115490.1,pol,1841,4853,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115490.1,vif,4797,5376,5040,5619,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115490.1,vpr,5315,5606,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115490.1,tat_exon1,5586,5805,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115490.1,rev_exon1,5725,5806,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115490.1,vpu,5817,6063,6060,6309,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115490.1,env,5980,8521,6223,8794,forward,0.46021436825118545,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115490.1,tat_exon2,8102,8198,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115490.1,rev_exon2,8103,8379,8376,8652,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115490.1,nef,8522,9137,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -MK115576.1,gag,468,1968,789,2292,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA -MK115576.1,pol,1760,4772,2084,5096,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MK115576.1,vif,4716,5295,5040,5619,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -MK115576.1,vpr,5234,5525,5558,5849,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MK115576.1,tat_exon1,5505,5724,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA -MK115576.1,rev_exon1,5644,5725,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -MK115576.1,vpu,5736,5982,6060,6309,forward,0.5399181166837258,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG -MK115576.1,env,5899,8440,6223,8794,forward,0.4583799776107468,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA -MK115576.1,tat_exon2,8021,8117,8375,8471,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA -MK115576.1,rev_exon2,8022,8298,8376,8652,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG -MK115576.1,nef,8441,9056,8795,9416,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA -OQ092466,gag,825,2361,789,2292,forward,0.2559303794507086,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCTAGCCTGTTAGAAACAGCAGAAGGCTGTAGACAAATATTGGGACAGTTACAACCGTCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACATTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGGTAAAAGACACCAAGGAAGCCTTAGAGAAGATAGAGGAAGAGCAAAACAAAAGCAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAGCAGCCAGGTTAGACACACAGGAAACAGCAGCCAGGTCAGCCAAAATTACCCTATAGTACAGAACCTTCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAATACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGACTACATCCAGTGCATGCAGGGCCCATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAGTAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTACACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGGGGACCCGGACATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCACGTAACAAATTCAAGTGCCATAATGATGCAGAGGGGCAATTTTAGAAACCAAAGAAAGGCTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCACCACCAGAAGAGATCTTCAGGTTTGTGGAAGAGACAACAACTCCCTCTCAGAAACAGGAGCCAATAGACAAGGAACTGTATCCTCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA -OQ092466,pol,2147,5165,2084,5096,forward,0.19193360134872262,FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCACCACCAGAAGAGATCTTCAGGTTTGTGGAAGAGACAACAACTCCCTCTCAGAAACAGGAGCCAATAGACAAGGAACTGTATCCTCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAGCTAAAGGAAGCTCTATTAGATACAGGGGCAGATGATACAGTATTAGAAGACATGAATTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAGGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTATTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGCATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGTATGACAAAAATCTTAGAGCCTTATAGAACACGAAATCCAGAAATGGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGACTTAGAAATAGGGCAACATAGAGCAAAAATAGAGGAACTGAGACAACATCTGTTGAAGTGGGGATTTACTACCCCAGACAAAAAACATCAAAAAGAACCTCCATTCCTTTGGATGGGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAAACAAAGACAGCTGGACTGTCAATGACATACAGAAACTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACCCAGGGATTAAGGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCGCTAACAGAAGAAGCAGAGTTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGGGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGGAAGGACAATGGACATTTCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGCGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAGGCATAGTAATATGGGGAAAAATTCCTAAATTTAGACTACCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAACACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAAACTAAAAAAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGATACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATACGCATTGGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTGATAAAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTGCTGGAATCAGGAAAGTATTATTTTTAGATGGAATAGAGAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGCTAAAAGGAGAAGCCATACATGGACAGGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTCATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATACGGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATCCAAACCAAAGAACTACAAAAACAAATTATAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTTATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -OQ092466,vif,5109,5688,5040,5619,forward,0.24677296886864086,MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGTATGTTTCAAGGAAAGCTAAGGGATGGTTTTATAGACATCACTTTGAAAGCAATCATCCAAAAATAAGTTCAGAAGTACACATCCCACTGGAGGATGCTAGACTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGGGTCTCCATAGAATGGAGGAAAAAGAGATATAGCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTACTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACACATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAATAACACCAAAAAAGAGAAAGCCACCCTTGCCTAGTGTTAAGAAGCTAACAGAAGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG -OQ092466,vpr,5627,5918,5558,5849,forward,0.2608047690014903,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAGCTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTCCATAGCTTAGGGCAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATTCTGCAACAACTGTTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -OQ092466,tat_exon1,5898,6117,5829,6045,forward,0.40192926045016075,MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ,MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ*,ATGGAGCCAGTAGATCCTAGGCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCACTTGTTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAGTAA -OQ092466,rev_exon1,6037,6118,5968,6046,forward,0.4807692307692307,MAGRSGDSDDELLKTVRLIKVLYQSSK,MAGRSGDSDDELLKTVRLIKVLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAGTAAG -OQ092466,vpu,6129,6375,6060,6309,forward,0.5077548005908421,MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL,MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL*,ATGCAACCTTTAACAATATTAGCAATAGTAGCACTAGTAGTAGCAGCAATACTAGCAATAGTTGTGTGGTCCATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGAGGGGGATCAGGAAGAATTATCAGCACTGGTGGAGAGGGGGCATCTTGCTCCTTGGAATGTTGATGATCTGTAA -OQ092466,env,6292,8875,6223,8794,forward,0.48559709145147756,MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL,MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL*,ATGAAAGTGAGGGGGATCAGGAAGAATTATCAGCACTGGTGGAGAGGGGGCATCTTGCTCCTTGGAATGTTGATGATCTGTAATGCTACAGAACAACAATTGTGGGTTACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGGTATTAAAAAATGTGACAGAAAATTTTAATATGTGGGAAAATAACATGGTAGAACAGATGCATGAAGATATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAGTTAACTCCACTCTGTGTTACTCTAAATTGCACTAATACCACTAGGAGTAGTGGAAATACTACCAATGAAATGAAAAACTGCTCTTTCTATACCGAAACAGACATAAGAGATAAGAAGAGAAAGGAATATGCACTTTTTTATGAACTTGATATAGTACCCATAGATGAGGATAATAAGAATAAGAGTAATAATATTAGCTATTCTAGGTTAATAAGTTGCAACACCTCAGTTATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATGATAAGAAATTCAATGGAACAGGGCCATGTACAAATGTCAGCACAGTGCAATGTACACATGGTATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGACGAGGTAGTAATTAAATCTAGCAATTTCACGAACAATGCTAAAACCATAATAGTACAGCTAAATGAAACTGTAAAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGACATAAGACAAGCACATTGTAACATCTCTAGAGCAAACTGGACAAACACTTTAAAACAGATAGCTGAAAAATTAGGAAAACAATTTGAGGAAAATAAAACAATAGTCTTTAATCCCTCCTCAGGAGGGGACCCAGAGGTTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATTCAACACCACTGTTTAATAGTACTTGGAAGGAGACTAATGGGATTTGGACTCGTATTGGAGAGTCAAATGATAGTGCTACTATCACACTAAATGATAGTGATACTATCACACTCCAATGTAAAATAAGGCAAATTATAAACTTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAAAGGACAAATTAGCTGTTTATCAAACATTACAGGGCTGCTATTAGTAAGAGATGGTGGCAATAACACGAACGGGACCGAGATCTTCAGACCTGTAGGAGGAGAAATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAGAAAAGAGCGACATTGGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAGGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGTAATAAATCTCTGGAAAAAATTTGGAATAATATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAAGCTTAATATACACCTTACTTGAAGAATCGCAGAACCAGCAAGAAAAAAATGAAAAAGAATTATTGGAATTAGATACATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATAATGATAATAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTCCAGATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGAACGGATTCTTAGCACTTTTCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCTCTCAAATACGGGTGGAGTCTCCTACAATATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAATATTACAAAGAGCTTGTAGAGCTATTCTCCATATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA -OQ092466,tat_exon2,8456,8552,8375,8471,forward,0.5303030303030303,RSTPQLRGDPTGPKESKEKVERETETDPVH,RSTPQLRGDPTGPKESKEKVERETETDPVH**,AGATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGA -OQ092466,rev_exon2,8457,8733,8376,8652,forward,0.3690449563855961,DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE,DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE*,GATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGAACGGATTCTTAGCACTTTTCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCTCTCAAATACGGGTGGAGTCTCCTACAATATTGGAGCCAGGAACTAAAGAATAG -OQ092466,nef,8876,9509,8795,9416,forward,0.411658382286489,MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC,MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC*,ATGGGTGGCAAATGGTCAAAAAGTAAGCTATTTGGATGGCCTGCTGTAAGGGAAAGAATGAGAAGAGCTGAGCCAGCAGCAGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACACGGAGCAATCACAAGTAGCAATACACCAACTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAAGAGGAGGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCGGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCCAAAAAGACAAGAGATCCTTGATCTGTGGGTCTATCATACACAAGGTTTCTTCCCTGATTGGGATAACTACACACCAGGGCCAGGGATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGTTAGTACCAGTGGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAATAACTGCTTGTTACACCCTATGAGCCAGCATGGGATGGAGGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCGTCACGTGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGA -OQ092463,gag,801,2313,140,1643,forward,0.2589641434262949,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGATAGATGGGAAAGAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAGCGGTTCGCAGTTAATCCTGGCCTGTTAGAAACATCAAAAGGCTGTAGACAAATATTGGAACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATAGATGTAAAAGACACCAAGGAAGCTTTAGATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAACACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGACCAGCCAGGCCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGACTAAATAAAATAGTAAGGATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAATCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAACAATGTACACAGGAGGTAAAAAATTGGATGACAGAAACATTATTGGTCCAAAATGCAAACCCAGATTGCAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCTGGCCATAAAGCAAGAGTTTTGGCAGAAGCAATGAGCCAAGTAACAACTCCAGGTACCATAATGATGCAGAGAGGCAATTTCAGGAACCAGAGAAAGAATGTTAAGTGTTTCAACTGTGGCAAAGAAGGGCATATAGCTAAAAATTGCAGGGCCCCTAGAAAAAGGGGCTGTTGGAAATGTGGAAAAGAAGGACACCAAATGAAAGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGGTAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA -OQ092463,pol,2105,5117,1435,4447,forward,0.14797358397500882,FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGGTAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGACATGACTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTTGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTAACTCAAATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATCTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAGTCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGATGAATTAAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGATATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGTTGCCAGAAAAGGACAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAGGCACTAACAGAAGTAGTACCACTAACAAGAGAAGCAGAGCTAGAGCTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAGTTACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAATGAGAGGTGCCCACACTAATGATGTAAAGCAACTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAGTTTAAACTACCCATACAAAGAGAAACATGGGACACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCTATAGTAGGAGCAGAAACTTTCTATGTAGATGGTGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGATACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTTAATCAAATAATAGAACAGTTAATAAAAAAGGACAAGGTATACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGATGACCATGAGAAATATCACAGTAATTGGAGGGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGCCAGTTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACACTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGGTATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCAGCAATTTCATCAGTACTACAGTTAAGGCCGCCTGCTGGTGGGCGGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATCATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATACATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAACTTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -OQ092463,vif,5061,5640,4391,4970,forward,0.32379004771642805,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGGACATGGAAAAGTTTAGTAAAACACCATATGTATATTTCAAGGAAAGCTAAGGGATGGGTTTATAAGCATCACTATGACAGTATTCATCCAAGAATAAGTTCAGAAGTTCACATCCCACTAGGGGATGCGAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCACTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAGGAGAGATATAGCACACAAGTAGACCCTGGCCTAGCAGACCAACTAATTCATCGGTATTACTTTGATTGTTTTTCAGAATCTGCCATAAGAAATGCCATATTAGGACGTATAGTTAGTCCTAGTTGTGATTATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG -OQ092463,vpr,5579,5870,4909,5200,forward,0.34013605442176864,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAITRILQQLLFIHFRIGCQHSRIGIIQRRRARNGTSRS,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAITRILQQLLFIHFRIGCQHSRIGIIQRRRARNGTSRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACACTTCCCTAGGCCATGGCTCCACAGCTTAGGGCAACATATCTATGAAACATATGGAGATACTTGGGCAGGAGTGGAAGCCATAACAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATCATTCAACGGAGGAGAGCAAGAAATGGAACCAGTAGATCCTAG -OQ092463,tat_exon1,5850,6069,5180,5399,forward,0.38728632478632474,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ*,ATGGAACCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA -OQ092463,rev_exon1,5989,6070,5319,5397,forward,0.3620426829268293,MAGRSGDSDEELIKTVRLIKLLYQSSK,MAGRSGDSDEELIKTVRLIKLLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAG -OQ092463,vpu,6081,6330,5411,5657,forward,0.44033465433729635,MQPLEISAIVALVVAIIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL,MQPLEISAIVALVVAIIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL*,ATGCAACCTTTAGAAATATCAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGGTCCATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGATAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAGGGGGATCAGGAAGAATTATCAGCACTTGTTGTGGAGATGGGGCACGATGCTCCTTGGGATGTTAATGATCTGTAG -OQ092463,env,6244,8827,5574,8124,forward,0.44564023273792597,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFYASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNTTSTKNTTPSTTASSGERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKKFNGSGPCTNVSTIQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKTIIVHLKDSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSSWKDESNGTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLITRDGGKNNESNTTEIFRPEGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKTLEQIWDNMTWMQWEREIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHPPAPRGPDRPEGIGEEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLNIPRRIRQGLERALL,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFYASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNTTSTKNTTPSTTASSGERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKKFNGSGPCTNVSTIQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKTIIVHLKDSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSSWKDESNGTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLITRDGGKNNESNTTEIFRPEGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKTLEQIWDNMTWMQWEREIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHPPAPRGPDRPEGIGEEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLNIPRRIRQGLERALL*,ATGAGAGCGAGGGGGATCAGGAAGAATTATCAGCACTTGTTGTGGAGATGGGGCACGATGCTCCTTGGGATGTTAATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACTACCACTCTATTTTATGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCTACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGGAAATGTGACAGAGAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTGAATTGCACTAATTATAATAACACCAATACCACTAGTACCAAGAATACCACCCCTAGTACCACTGCTAGTAGCGGGGAAAGGATGGGGGAAGGAGAAATAAAAAACTGCTCTTTCAATATCACCACAAGCCTAAGAGATAAGATGCAGAAAGAATATGCACTCTTTTATAGACCTGATATAGTACCAATAGATAATGATAATACTAGTTATAGGTTGATAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCAGCTGGTTTTGCGATTCTAAAGTGTAACAATAAGAAGTTCAATGGATCAGGACCATGTACAAATGTCAGCACAATACAATGTACACATGGAATTAGGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGAAAATTTCTCAGACAATGCTAAAACCATAATAGTACATCTGAAGGATTCTGTAGAAATTACTTGTATAAGACCCAACAACAATACAAGAAAAAGTATACCTATGGGACCAGGGAAAGCATTTTTTGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAAAATTAATAAAACGAAATGGAATAACACTTTAGACCAGATATTTAAAAAGTTAAGAGAACAATTTGGGAATAATAAGACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTGTAACGCACAATTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACATCAAAACTGTTTAATAGTACTTGGAATGAGACTAGTTCTTGGAAGGATGAGTCAAATGGCACTATCACACTCCCATGCAGAATAAAGCAAATTATAAACCTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGACTCATTAAATGTTCATCAAATATCACAGGGCTGCTAATAACAAGAGATGGTGGGAAAAATAATGAGAGCAACACCACCGAGATTTTCAGACCTGAAGGAGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAAACTCTGGAACAGATTTGGGATAACATGACCTGGATGCAATGGGAAAGAGAAATTGACAATTACACAAGCTTGATATACACTTTAATTGAAGAATCGCAAAACCAACAAGAAAAGAATGAACTAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTGCTTTCTATAGCGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCACCCCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCGGGGGGTGGGAACTCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTATTAGCTTGCTTAATGCTACAGCCATAGCAGTAGCTGAGGGGACAGACAGGATTATAGAAGTATTACAAAGAGCTGGGAGAGCTTTTCTCAACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA -OQ092463,tat_exon2,8408,8504,7705,7798,forward,0.4918032786885247,RPTPQPRGDPTGQKESEKKVERETETDPDH,RPTPQPRGDPTGQKESEKKVERETETDPDH**,AGACCCACCCCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGA -OQ092463,rev_exon2,8409,8685,7706,7982,forward,0.3471418653089562,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE*,GACCCACCCCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCGGGGGGTGGGAACTCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG -OQ092463,nef,8828,9461,8125,8752,forward,0.33768732280275404,MGGKWSKSSVVGWPAIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC,MGGKWSKSSVVGWPAIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC*,ATGGGTGGTAAGTGGTCAAAAAGTAGTGTGGTTGGATGGCCTGCTATAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTAGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCAGGCCTCAGGTACCTTTAAGACCAATGACTTATAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAGAAAAGACAAGATATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTGCCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGATGACCCAGAGAAAGAAGTGTTAGTATGGAGATTTGACAGTCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGGATTGCTGA -OQ092465,gag,855,2358,200,1700,forward,0.38383718162342295,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQQIDVKDTKEALDKIEEEQNKSKKKVQQAATDTGNNSQASQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGAIMMQRGNFRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEETTTPSQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQQIDVKDTKEALDKIEEEQNKSKKKVQQAATDTGNNSQASQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGAIMMQRGNFRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEETTTPSQKQEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGATAGGTGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAACTAGAACGGTTTGCAGTTAATCCTGGCCTGTTAGAAACATCAAAAGGCTGTAGACAAATATTGGAACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAACAGATAGATGTAAAAGACACCAAGGAAGCTTTAGATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGTACAGCAAGCAGCAACTGACACAGGAAACAACAGCCAGGCCAGCCAAAATTACCCTATAGTGCAGAATCTCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAATCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAACAATGTACACAGGAGGTAAAAAATTGGATGACAGAAACATTATTGGTCCAAAATGCAAACCCAGACTGCAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCTGGCCATAAAGCAAGAGTTTTGGCAGAAGCAATGAGCCAAGTAACAACTCCAGGTGCCATAATGATGCAGAGAGGCAATTTCAGGAGCCAAAGAAAGACTGTTAAGTGTTTCAACTGTGGCAAAGAAGGGCATATAGCTAAAAATTGCAGGGCCCCTAGAAAAAGGGGCTGTTGGAAATGTGGAAAAGAAGGACACCAAATGAAAGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTCGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA -OQ092465,pol,2150,5162,1492,4504,forward,0.21863141758600757,FFREDLAFPQGEAREFSSEQTRANSPTSRELQVRGGDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCRLLKGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTSRELQVRGGDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCRLLKGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTCGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGACACAGGAGCAGATGATACAGTATTAGAAGACATGACTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTTGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTTTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATCTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGATGAATTAAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGTTGCCAGAAAAAGACAGTTGGACTGTTAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAGGTAAAGCAATTATGTAGACTCCTTAAGGGAACCAAGGCACTAACAGAAGTAGTACCACTAACAAGAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAGTTACAGAAGCAGGGACAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGAGGTGCCCACACTAATGATGTAAAACAGCTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAGTTTAAACTACCCATACAAAGAGAAACATGGGACACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTTTATGTAGATGGTGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAATAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACCACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATCCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTTAATCAAATAATAGAACAGTTAATAAAAAAGGACAAAGTATACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGATGATCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGCCAGTTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACACTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGTGGCAATTTCATCAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAATTTGGCATACCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATCATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATACATACACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAACTTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -OQ092465,vif,5106,5685,4448,5027,forward,0.3589413907639558,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWIYKHHYDSINPKISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADRLIHLYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALTALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWIYKHHYDSINPKISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADRLIHLYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALTALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGGACATGGAAAAGTTTAGTAAAACACCATATGTATATTTCAAAGAAAGCTAAGGGATGGATTTATAAGCATCACTATGACAGTATTAATCCAAAAATAAGTTCAGAAGTTCACATCCCACTAGGGGATGCAAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTAGCAGACCGACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACGTATAGTTAGTCCTAGTTGTGATTATCAAGCAGGACATAACAAGGTAGGGTCTCTACAGTACTTGGCACTAACAGCACTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG -OQ092465,vpr,5624,5915,4966,5257,forward,0.2400808693454637,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGILQRRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGILQRRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACACTTTCCTAGGCCATGGCTACACAGCTTAGGGCAACATATCTATGAAACATATGGAGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATCCTTCAACGGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -OQ092465,tat_exon1,5895,6114,5237,5456,forward,0.2515090543259557,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ*,ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA -OQ092465,rev_exon1,6034,6115,5376,5454,forward,0.4807692307692307,MAGRSGDSDEELIKTVRLIKLLYQSSK,MAGRSGDSDEELIKTVRLIKLLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAG -OQ092465,vpu,6126,6375,5468,5708,forward,0.3726554787759131,MQPLVISAIVALVVVAIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL,MQPLVISAIVALVVVAIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL*,ATGCAACCTTTAGTAATATCAGCAATAGTAGCATTAGTAGTAGTAGCGATAATAGCAATAGTTGTGTGGTCCATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGATAATTGATAGAATAAGGGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAGGGGGATCAGGAAGAATTATCAGCACTTGTTGTGGAGATGGGGCACGATGCTCCTTGGGATGTTAATGATCTGTAG -OQ092465,env,6289,8881,5631,8208,forward,0.48107374453325313,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTGANNTTSTNTTTPSTTVSSEERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNTSYRLISCNTSVITQACPKVTFEPIPIHYCAPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKNIIVHLNKSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLEQVFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSYWKGEGSNNDTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLLTRDGGNESETTDTETFRPVGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKNLTQIWDNMTWMQWEKEIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTGANNTTSTNTTTPSTTVSSEERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNTSYRLISCNTSVITQACPKVTFEPIPIHYCAPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKNIIVHLNKSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLEQVFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSYWKGEGSNNDTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLLTRDGGNESETTDTETFRPVGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKNLTQIWDNMTWMQWEKEIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL*,ATGAGAGCGAGGGGGATCAGGAAGAATTATCAGCACTTGTTGTGGAGATGGGGCACGATGCTCCTTGGGATGTTAATGATCTGTAGCGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTGTGGGCTACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGGAAATGTGACAGAGAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGTCTAAAACCATGTGTAAAATTAACCCCACTCTGTGTTACTTTGAATTGCACTAATTATAATAACACTGGTGCCAATAATACCACTAGTACCAATACTACCACCCCTAGTACCACTGTTAGTAGCGAGGAAAGGATGGGGGAAGGAGAAATAAAAAACTGCTCTTTCAATATCACCACAAGCCTAAGAGATAAGATGCAGAAAGAATATGCACTCTTTTATAGACCTGATATAGTACCAATAGATAATACTAGTTATAGGTTGATAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAGCCAATTCCCATACATTATTGTGCCCCAGCTGGTTTTGCGATTCTAAAGTGTAACAATAAGACGTTCAATGGATCAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGAAAATTTCTCAGACAATGCTAAAAACATAATAGTACATCTGAATAAATCTGTAGAAATTACTTGTATAAGACCCAACAACAATACAAGAAAAAGTATACCTATGGGACCAGGGAAAGCATTTTTTGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAAAATTAATAAAACGAAATGGAATAACACTTTAGAGCAGGTATTTAAAAAGTTAAGAGAACAATTTGGGAATAATAAGACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTGTAACGCACAATTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACATCAAAACTGTTTAATAGTACTTGGAATGAGACTAGTTATTGGAAGGGTGAAGGGTCAAACAATGACACTATCACACTCCCATGCAGAATAAAGCAAATTATAAACCTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACTCATTAAATGTTCATCAAATATCACAGGGCTACTATTAACAAGAGATGGTGGTAACGAGAGCGAGACCACCGACACTGAGACCTTCAGACCTGTAGGAGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGATTAGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAAAATCTGACACAGATTTGGGATAACATGACCTGGATGCAATGGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTGAAGAATCGCAAAACCAACAAGAAAAGAATGAACTAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTGCTTTCTATAGCGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCGGGGGGTGGGAACTCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTATTAGCTTGCTTAATGCTACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGCAGGGAGAGCTTTTCTCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA -OQ092465,tat_exon2,8462,8558,7789,7885,forward,0.5337214944201844,RPTSQPRGDPTGQKESKEKVERETETDPDH,RPTSQPRGDPTGQKESKEKVERETETDPDH**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGA -OQ092465,rev_exon2,8463,8739,7790,8066,forward,0.41220115416323155,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCGGGGGGTGGGAACTCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG -OQ092465,nef,8882,9515,8209,8842,forward,0.3463855421686747,MGGKWSKSSVVGWPKIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC,MGGKWSKSSVVGWPKIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGGTTGGATGGCCTAAAATAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGAACCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCAGGCCTCAGGTACCTTTAAGACCAATGACTTATAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAGAAAAGACAAGATATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGATGACCCAGAGAAAGAAGTGTTAGTATGGAGATTTGACAGTCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGA -OQ092462,gag,767,2270,789,2292,forward,0.316486214000789,MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAGCTAAAACATATAGTATGGGCAAGCAGGGAACTAGAGCGATTTGCAGTTAATCCCGGCCTGTTAGAAACATCGGAGGGCTGTAGACAAATACTAGGGCAACTACAGCCCGCTCTTCAGACAGGATCAGAAGAACTTAAATCACTATTTCATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTGAAAGACACCAAAGAAGCTTTAGAGAAGATAGAGGAAGAGCAAAAGAAAAGTAAGAAAAAGGCACAGCAAGCAGCCGCTGACACAGGAAATAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATGCAGGGACAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGATAAGGCTTTCAGTCCAGAAGTAATACCCATGTTTACAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAATACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTACATCCAGTGCAGGCAGGGCCTGTTGCGCCAGGCCAGCTACGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTAACCTTCAGGAGCAAATAGCATGGATGACACATAATCCACCTGTCCCAGTAGGAGAAATCTATAAAAGATGGATACTTCTGGGATTAAATAAAATAGTAAGAATGTACAGCCCCGTCAGCATTCTGGACATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCTGAGCAGGCTTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAGCAAATCCAGCTAGCATAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGCCTATTAAGTGTTTCAACTGTGGCAAAGAGGGGCATATTGCTAAAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGGTCTGGCCTTCCCGCAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACGACAACTCCCTCTCAGAAACCGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA -OQ092462,pol,2062,5074,2084,5096,forward,0.1943357603710517,FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGGTCTGGCCTTCCCGCAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACGACAACTCCCTCTCAGAAACCGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGAGGGCAACTAAAGGAAGCTCTATTAGACACAGGAGCAGATGATACAGTTTTAGAAGAAATGAATTTGCCAGGAAAATGGAAGCCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGCTGCACTTTAAATTTTCCCATTAGCCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATCTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCCATAAAGAAGAAAGATGGTAATAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCTGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAGGACTTCAGGAAGTATACTGCATTTACAATACCTAGCACAAACAATGAGACACCAGGGATTAGATACCAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTGGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATTTATCAATACATGGATGATTTATATGTAGGGTCTGACTTAGAAATAGGGCAGCATAGAGCAAAAATAGAGGAACTGAGACAACATCTATTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCCGATAAATGGACAGTACAGCCTATATTGCTGCCAGAAAAAGACAGCTGGACTGTTAATGACATACAGAAGTTAGTGGGAAAATTGAACTGGGCAAGTCAGATTTACCCAGGAATCAAAGTAAGGCAGCTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTGGTACCACTAACAGCAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGATTTAATAGCAGAACTACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATATAAAAATCTGAAAACAGGAAAGTATGCAAGAATGAGAGGTACCCACACTAATGATATAAAACAATTAACAGAGGCAGTGCAAAAAATAGCTACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAATTACCCATACAAAAGGAAACATGGGAAGCATGGTGGATAGAGTATTGGCAAGCCACCTGGATTCCTGAATGGGAGTTTGTCAATACCCCTCCCTTAGTGAAACTATGGTACCAGTTGGAAAAAGAACCCATAGTGGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGGGAAACTAAATTAGGAAAAGCAGGATATGTTACTGACAAAGGAAGACAAAAAGTTGTCCCCCTAACGGACACAACAAATCAGAAGACTGAGCTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAACTAGTCAGTCAAATAATAGAGCAGTTAATAAAGAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAGTTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACCTGCCACCTATAGTAGCAAAGGAAATAGTAGCCAGTTGTGACAAATGTCAGTTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCTGGAATATGGCAGCTAGATTGTACACATCTAAAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTCTCTTGAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCTGCCTGTTGGTGGGCGGGGATCAAACAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGAAGTAATAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCAGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCGTCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACCAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATTATCAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -OQ092462,vif,5018,5597,5040,5619,forward,0.3566796368352788,MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAGAGTTTAGTAAAACATCATATGCATATATCAAGGAAAGCTAAGAATTGGTTGTATAGACATCACTATGAAAGCATTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTAGTAATAACAACATATTGGGGTCTGCTTACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGGAAAGGAGATATAGAACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTATTTTGATTGTTTTTCAGAGTCTGCTATAAGAAATGCCTTATTAGGACGTGTAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACCAGGTAGGATCTCTACAGTACTTGGCACTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGGCACTAG -OQ092462,vpr,5536,5827,5558,5849,forward,0.2608047690014903,MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS,MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGGCACTAGAACTTTTAGAGGAACTTAAAAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTTCATGGATTGGGACAGCATATCTATGAAACATATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGATGTCGACATAGCAGAATAGGCATTAATCTACAGAGGAGAGCAAGGAATGGATCCAGTAGATCCTAG -OQ092462,tat_exon1,5807,6026,5829,6045,forward,0.37688442211055273,MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ,MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ*,ATGGATCCAGTAGATCCTAGCCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTACCAATTGTTATTGTAAAAAGTGCTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGTAA -OQ092462,rev_exon1,5946,6027,5968,6046,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKFLYQSSK,MAGRSGDSDEELLKAVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGTAAG -OQ092462,vpu,6038,6284,6060,6309,forward,0.5464940306036659,MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL,MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL*,ATGCGACCTTTAGAAATAGCAGCAATAGTAGCACTAGTAGTAGCAGTACTAATAGCAATAGTTGTGTGGTCTATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGATAGTGGATAGAATAAGAGAAAGAGCAGAAGATAGTGGAAATGAGAGTGAAGGGGATCAGGAGGAATTATCAGCACTGGTGGAGAGGGGGCACCTTGCTCCTTGGGATATTGATGATCTGTAG -OQ092462,env,6201,8778,6223,8794,forward,0.5083167934238491,MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL,MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAGGAATTATCAGCACTGGTGGAGAGGGGGCACCTTGCTCCTTGGGATATTGATGATCTGTAGTGCCACAGAGAACTTGTGGGTCACAGTCTACTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTTTATTTTGTGCATCAGATGCCAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAGCCCACAAGAAGTAGTATTGAAAAATGTGACAGAAAAGTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATCAGGATATAATCAGTTTATGGGATGAAAGCCTAAAACCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATGCTACTATCAGTGGTAATGCAACAGAAGAAATAAAAAACTGCTCTTTCAATGTCAATACAAAAATAGGAGGTAAGAAGCAGAAAGAACGTGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAGTACTAATAGGACTAATACCAGCTATAGGTTGATAAGTTGTAACACTTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTGGAGATAAAGAGTTCAATGGAACAGGACTATGTAGAAATGTCAGCACAGTCCAATGTACACATGGAATCAGGCCAGTAGTATCAACTCAATTGCTGTTGAATGGCAGTCTAGCAGAAGGAGAGGTAGTAATTAAATCTGAAAATATCACGAACAATGTTAAAACCATAATAGTACAGCTAAATGAAACTGTATCAATTAATTGTACAAGACCTAGCAACAATACAAGAAGAAGCATACATATGGGACCAGGGAGAGCCTTTTATGCAACAGGAGAAATAATAGGAGATATAAGGAAAGCACAGTGTATCCTGAATAAGACAGACTGGAGTGACACTTTAACAAGGATAGCTAAAAAATTACACAAGCAATTTCATGGACCAATAGCATTTGAGCAATCCTCAGGAGGGGACCCTGAAATTACAATGCACACTTTTAATTGTGGAGGGGAATTTTTCTACTGCAACACATCAGCGTTGTTTAGCGGGACCTGGAATGGTACTGCTTGGACTAATGCTACTTGGGGTAATATTGCAGGTAACAATATCACACTCCAATGCAGAATAAAACAATTTATAAACAGATGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGAGAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGCAGTAACACAACAAATGGTGGCGAGAATGGGACCCAGATTGGCGAGAATGTGACCCAGATCTTCAGACCTGGAGGAGGGGATATGAGGGACAATTGGAGAAGTGAATTATACAAATATAAAGTAGTAAAAATTGAGCCATTAGGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTAACATTCGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACACTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTTCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAGGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATGCTAGTTGGAGTAATAAAACTCTGGAAAAAATTTGGGGGAACATGACCTGGATGGAGTGGGAGAGAGAAATTGACAATTATACAGACTTAATATACACCTTAATTGAACAATCGCAGAACCAACAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAGGCTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGTTTAGTAGGTTTAAGAATAGTTTTTGCTGTGCTTTCTATAGTAAATAGAGTTAGGCAGGGATACTCACCATTATCATTCCAGACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGAACGGATTCTTAGCACTCATCTGGATCGACCTGCGGAGTCTGTTCCTCTTCAGCTACCTCCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGTTTGCTTAATGCTATAGCTATATCAGTAGCGGAGGGAACAGATAGGATTATAGAAGCAATACAAAGAATTTGTAGAGCTATCTTACACATACCTACAAGGATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -OQ092462,tat_exon2,8359,8455,8375,8471,forward,0.4034761018001243,RPASQPRGDPTGPKEPTKKVERETETDPDH,RPASQPRGDPTGPKEPTKKVERETETDPDH**,AGACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGA -OQ092462,rev_exon2,8360,8636,8376,8652,forward,0.38952607660679506,DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE,DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE*,GACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGAACGGATTCTTAGCACTCATCTGGATCGACCTGCGGAGTCTGTTCCTCTTCAGCTACCTCCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG -OQ092462,nef,8779,9406,8795,9416,forward,0.5049429657794677,MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC,MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC*,ATGGGTGGCAAGGGGTCAAAAATGAGGGGATGGGTTGCTGTAAGGGAAAAAATGAGGCGAACTAAGCCAGAAGATGAGCCAGCAGCAAATGGGGTGGGGGCAGCATCTCGAGACTTGGAGAAATATGGCGCACTCACAAGTAGCAATACAGTAGCTACTAATGCTGATTTAGCTTGGCTAGAAGCACAAGAGGAAGAGGAGGTGGGCTTTCCAGTCAGACCTCAAGTACCTTTAAGACCAATGACTTACAAGGGAGCTCTAGATCTCAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGGTTCACCACACACAAGGCTATCTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCCCTGACTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATCAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATAGAGGACCCGGAGAAAGAAGTCTTAATGTGGAAGTTTGACAGCCACCTAGCATTCCGTCACATGGCCCGAGAGCTGCATCCGGAGTATTACAAAGACTGCTGA -OQ092464,gag,773,2276,200,1700,forward,0.3910844507174782,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGATAGATGGGAAAGAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGGTTCGCAGTTAATCCTGGCCTGTTAGAAACATCAAAAGGCTGTAGACAAATATTGGAACAGCTACAGCCAGCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATCGATGTAAAAGACACCAAGGAAGCTTTAGATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGCCAGCCAAAATTACCCTATAGTGCAGAACATTCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCGCTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAACAATGTACACAGGAGGTAAAAAATTGGATGACAGAAACATTATTGGTCCAAAATGCAAACCCAGATTGCAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCTGGCCATAAAGCAAGAGTTTTGGCAGAAGCAATGAGCCAAGTAACAACTCCAGGTACCATAATGATGCAGAGAGGCAATTTAAGGAGCCAAAGAAAGACTGTTAAGTGTTTCAACTGTGGCAAAGAAGGGCATATAGCTAAAAATTGCAGGGCTCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAAGAAGGACACCAAATGAAAGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAAGAAATGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA -OQ092464,pol,2068,5080,1492,4504,forward,0.21863141758600757,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAAGAAATGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGACATGACTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTAACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATCTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTAAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGATATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAGGACAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAGGCACTAACAGAAGTAATACCACTAACAAGAGAAGCAGAGCTAGAACTGGCAGAGAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGTAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGAGGTGCCCACACTAATGATGTAAAACAACTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAGTTTAGACTACCCATACAAAGAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAGACTTTCTATGTAGATGGTGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTTAATCAAATAATAGAACAGTTAATAAAAAAGGACAAGGTATACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGACGATCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGCCAGTTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACACTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCGGCAATTTCATCAGTACTACAGTTAAGGCCGCCTGCTGGTGGGCGGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATACATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAGAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAACTTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGACCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -OQ092464,vif,5024,5603,4448,5027,forward,0.3264662839130924,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGGACATGGAAAAGTTTAGTAAAACACCATATGTATATTTCAAGGAAAGCTAAGGGATGGGTTTATAAGCATCACTATGACAGTACTCATCCAAGAATAAGTTCAGAAGTTCACATCCCGCTAGGGGATGCGAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAGAAGAGATATAGCACACAAGTAGACCCTGGCTTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGCTGTGATTATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG -OQ092464,vpr,5542,5833,4966,5257,forward,0.2678354029705382,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGIIQRRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGIIQRRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACACTTTCCTAGGCCATGGCTCCACAGCTTAGGGCAACATATCTATGAAACATATGGAGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCATCATTCAACGGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -OQ092464,tat_exon1,5813,6032,5237,5456,forward,0.2515090543259557,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAPPDSQTHQASLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAPPDSQTHQASLSKQ*,ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCCAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA -OQ092464,rev_exon1,5952,6033,5376,5454,forward,0.4807692307692307,MAGRSGDSDEELLQTVRLIKLLYQSSK,MAGRSGDSDEELLQTVRLIKLLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCCAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAG -OQ092464,vpu,6044,6290,5468,5708,forward,0.4384802297327147,MQPLHIAAIVALVVAIIIAIVVWSIVFIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVEMGHCAPWDVNDL,MQPLHIAAIVALVVAIIIAIVVWSIVFIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVEMGHCAPWDVNDL*,ATGCAACCTTTACACATAGCAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGATAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAGGGGGATCAAGAAGAATTATCAGCACTTGTGGAGATGGGGCATTGTGCTCCTTGGGATGTTAATGATCTGTAG -OQ092464,env,6207,8790,5631,8208,forward,0.4684887834843129,MRVRGIKKNYQHLWRWGIVLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNNTTSTNDTTSTTTSSGEKMKEGEIKNCSFNITTSIRDKVQKEYALFYKPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGSCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSENFSDNAKTIIVHLNESVEITCIRPNNNTRKSIPIGPGRAFYATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNKTIIFTHSSGGDPEVVTHNFNCGGEFFYCNTTKLFNSTWNETSYWKDERSNDNDTITLPCRIKQIINLWQEVGKAMYAPPIRGYIKCSSNITGLLITRDGGKNESNTTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWDNMTWMEWEREIDNYTSLIYTLIEKSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSGPLVNGFLTIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL,MRVRGIKKNYQHLWRWGIVLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNNTTSTNDTTSTTTSSGEKMKEGEIKNCSFNITTSIRDKVQKEYALFYKPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGSCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSENFSDNAKTIIVHLNESVEITCIRPNNNTRKSIPIGPGRAFYATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNKTIIFTHSSGGDPEVVTHNFNCGGEFFYCNTTKLFNSTWNETSYWKDERSNDNDTITLPCRIKQIINLWQEVGKAMYAPPIRGYIKCSSNITGLLITRDGGKNESNTTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWDNMTWMEWEREIDNYTSLIYTLIEKSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSGPLVNGFLTIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL*,ATGAGAGTGAGGGGGATCAAGAAGAATTATCAGCACTTGTGGAGATGGGGCATTGTGCTCCTTGGGATGTTAATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCTACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGGAAATGTGACAGAGAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGTCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTGAATTGCACTAATTATAATAACACCAATAATACCACTAGTACCAATGATACCACTAGTACCACTACTAGTAGCGGGGAAAAGATGAAGGAAGGAGAGATAAAAAACTGCTCTTTCAATATCACCACAAGCATAAGAGATAAGGTGCAGAAAGAATATGCACTCTTTTATAAACCTGATATAGTACCAATAGATAATGATAATACTAGTTATAGGTTGATAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCAGCTGGTTTTGCGATTCTAAAGTGTAACGATAAGAAGTTCAATGGAACAGGATCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCTCAGACAATGCTAAAACCATAATAGTACATCTGAATGAATCTGTAGAAATTACTTGTATAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGACCAGGGAGAGCATTTTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAAAATTAATAAAACGAAATGGAATAACACTTTAGACCAGATATTTAAAAAGTTAAGAGAACAATTTGGGAATAAGACAATAATCTTTACTCACTCCTCAGGAGGGGACCCAGAAGTTGTAACGCACAATTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGAGACTAGTTATTGGAAGGATGAAAGGTCAAATGACAATGACACTATCACACTCCCATGCAGAATAAAGCAAATTATAAACCTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGATACATTAAATGTTCATCAAATATCACAGGGCTGCTAATAACAAGAGATGGTGGGAAAAACGAGAGCAACACCACCGAGACCTTCAGACCTGGAGGAGGAAATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAAAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGGATAACATGACCTGGATGGAATGGGAAAGAGAAATTGACAATTACACAAGCTTAATATACACTTTAATTGAAAAATCGCAAAACCAACAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGCGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAACTCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTATTAGCTTGCTTAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGCTGGGAGAGCTTTTCTCCACATACCTAGAAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -OQ092464,tat_exon2,8371,8467,7789,7885,forward,0.4971219256933542,RPTSQPRGDPTGQKESKKKVERETETDPDH,RPTSQPRGDPTGQKESKKKVERETETDPDH**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGA -OQ092464,rev_exon2,8372,8648,7790,8066,forward,0.3934495959166312,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILNNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGTPQILVESPAVLESGTKE,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILNNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGTPQILVESPAVLESGTKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAACTCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG -OQ092464,nef,8791,9412,8209,8842,forward,0.36363636363636354,MGGKWSKSSVVGWPAIRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEDEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIHSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC,MGGKWSKSSVVGWPAIRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEDEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIHSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC*,ATGGGTGGTAAGTGGTCAAAGAGTAGTGTGGTTGGATGGCCTGCTATAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGATGAGGAGGTGGGTTTTCCAGTCAGGCCTCAGGTACCTTTAAGACCAATGACTTACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGGTATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGATGACCCAGAGAAAGAAGTGTTAGTATGGAGGTTTGACAGTCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGA -OQ092467,gag,808,2308,789,2292,forward,0.2880084183556755,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAAAAACAATACAAATTAAAACATCTAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTTCTAGAGACATCAGAAGGGTGTAGACAAATACTGGGACAGCTACAACCAGCTCTTCAGACAGGATCAGAAGAATTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAAATAGAGGAAGAGCAAAACCAAAGTAAGAAAAAAGCAGCAGCTGCAGCAGCTGACACAGGAAACAGAAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCTTTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTACAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAATAGGTGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCAGGCAGGGCCTGTTGCACCAGGCCAAATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTAACCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGATATCTATAAAAGATGGATAATTCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTGAGAGCCGAGCAAGCAACACAGGAAGTAAAGAATTGGATGACAGAAACTTTGCTGGTCCAAAATGCAAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCAGGCCACAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAACTGTAATGATGCAGAGAGGCAATTTTAGGAATCAAAGAAAGACAGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCATATAGCAAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAAAGAAGGGCACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAAACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGGGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA -OQ092467,pol,2100,5112,2084,5096,forward,0.1880239208210378,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAAACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGGGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAAATAGGGGGGCAGCTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGATATGAATTTACCAGGAAAATGGAAACCAAAAATGATAGGAGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGCTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGATAGTACTAAATGGAGAAAGTTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCGCATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCCTATTTTTCAATTCCCTTAGATAAAGACTTCAGGAAGTACACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAGGATATTAGAACCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTGGGATCTGACTTAGAAATAGGACAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGAAGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAAAGCTGCCAGAAAAAGATAGCTGGACTGTCAATGACATCCAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTATGCAGGAATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACTAAAGCACTAACAGAAGTAGTACCACTAACAGCAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCGGTACATGGAGTGTATTATGACCCAACGAAAGACCTAATAGCAGAACTACAGAAGCAGGGGCAAAGTCAATGGACATATCAAATTTATCAAGAACCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAATGAGGGGTGCCCACACTAATGATGTGAAACAATTAACAGAGGCAGTGCAAAAAATAGCCATAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAAATTACCTATACAAAAAGAAACATGGGAAACATGGTGGACAGACTATTGGCAAGCCACCTGGATTCCTGATTGGGAGTTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAAAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAGATCAGGCAAAGCAGGATATGTTACTGATAGAGGAAGACAAAAGGTTGTCCCCCTAACAGACACAACAAACCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTGACAGACTCACAATATGCACTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGTTAATAAAGAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGGAAGATACTATTTTTAGATGGAATAACTAAGGCCCAAGATGATCATGAGAGATACCACAGCAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTATAATAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCACGCATGGACAAGTAGACTGCAGTCCAGGAATATGGCAACTAGATTGTACGCATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTCTCTTAAAACTAGCAGGAAGATGGCCAGTAAAGACAGTACATACAGATAATGGCAGCAATTTCACCAGTGCTGCGGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCCCAAAGTCAAGGAGTCATAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAAGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAGAAACAAATCACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGACCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAGGCAAAGATCATTAGAGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -OQ092467,vif,5056,5635,5040,5619,forward,0.41532297468972923,MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATACATGTCTCAAAGAAAGCTAAGGGATGGGTTTATAGACACCACTATGAAAGCACCCATCCAAGAATAAGTTCAGAAGTACATATCCCGCTAGGGGAAGCTAGATTAGTAATAGCAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCACTTGGGTCAGGGAGTCTCCATAGAATGGAGGGAAAAGAAATATATCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGCATTATTTTGATTGTTTTTCAGAGTCTGCTATAAGAAATGCCATAGTAGGACGTTTAGTTAGCCCTCAGTGTGAATATCAAACAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGTAGCATTAATAACGCCAAAAAAGAGAAAGCCACCTTTGCCTAGTGTTAGGAAATTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGACCACAGAGGGAGCCATATAATGAGTGGACACTAG -OQ092467,vpr,5574,5865,5558,5849,forward,0.3120665742024965,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGACCACAGAGGGAGCCATATAATGAGTGGACACTAGAGCTTTTAGAGGAACTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTCCATAACTTAGGACAATACATCTATGCAACTTATGGGGATACTTGGACAGGAGTGGAAGCTTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGATGTCAACATAGCAGAATAGGCATTACTCGACAGAGGAGAGCAAGGAATGGAGCCAGTAGATCCTAG -OQ092467,tat_exon1,5845,6064,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTCTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAACAGTGAGACTCATCAAGCAGCTCTATCAAAGCAGTAA -OQ092467,rev_exon1,5984,6065,5968,6046,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKQLYQSSK,MAGRSGDSDEDLLKTVRLIKQLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAACAGTGAGACTCATCAAGCAGCTCTATCAAAGCAGTAAG -OQ092467,vpu,6076,6340,6060,6309,forward,0.4955621301775147,MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL,MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL*,ATGCAACCCTTAGTAATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAGAAAGATAGATAGCATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAGGAAGAATTGTCGGCACTTGTGGAGATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAG -OQ092467,env,6239,8807,6223,8794,forward,0.4703403690377699,MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL,MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL*,ATGAGAGTGAAGGAGATCAGGAAGAATTGTCGGCACTTGTGGAGATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAGTGCTAAAGAACAATTGTGGGTCACAGTTTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTTTATTTTGTGCATCAAATGCTAAAGCATATGACCCAGAGGTGCATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACAAGAAGTACCATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGACATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTATTTTAAATTGCACTAATGTGAATGTTACTACTAACAATAATAGTAGTAGTGAGGAACAGATGGAGGTAGGAGAAATAAAAAACTGCTCTTTCAATATTGCCACAAGAATAAAAAATAAGATAAAGAAAGAATATGCACTTTTTAATAGACTTGATGTAGTACCAATAGAGGATGATAATACAAGCTATATGTTGATAAATTGTAATACCTCAGTCACTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATACTAAAATGTAATGATAAAAAGTTCAATGGAACAGGACCATGTAACAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGATAGTAGTTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACAGCTGAATAAAACTATAGAAATTAATTGTATAAGACCCAACAATAATACAAGAAAAAGTATATCTTTAAGACCGGGGCAAGCAATTTATGCAACAGAAGACATAATAGGAAATATAAGACAAGCACATTGTAACATTAGGAGAAAAGACTGGGATAAAGCTTTAGAACAGGTAGTTGCAAAATTAAGAGAACAATTTAAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAGGAGACCCAGAAATTGTAATGCATAGTTTTAATTGTGCAGGGGAATTTTTCTACTGTAACACAACAAAGCTGTTTAATAGTACTTGGAATGTTAATAACACTCGGAATAATACTACTGATAATAGCACCATCACTCTCCCGTGCAGAATAAAACAAATTATAAACAGATGGCAGGAAGTAGGAAAAGCAATGTATGCTCCTCCCATCAAAGGGCAAATTAAATGTTCATCAAATATTACAGGGTTATTATTAACAAGAGATGGTGGTGTCCGCGAGGACAACGCCCCTGAGATCTTTAGACCTGGAGGAGGAGATATGAGGGATAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTGGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAAAGAGGAAAAAGAGCAGTAACGCTGGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGGCAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACTTACAGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTACCTTGGAATACTAGTTGGAGTAATAAATCTTTGGAAAAGATTTGGAAAAACATGACCTGGATGGAGTGGGAGAAAGAAATTAACAATTACACAAGGACAATATACACCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAGGAATTATTGGAATTGGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATCATGATAGTAGGAGGTATAGTAGGGTTAAGAATAGTTTTTACTGTGCTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTGTCATTCCAGACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGAACGGATTCTTTGCGCTTATCTGGGACGACCTGCAGAGCCTGTGCCTCTTCAGCTACCGCCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAAGAGTGCTGTTAGTTTGCTTAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAATTGGTAGAGCTATTCTCCACATCCCTAGAAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA -OQ092467,tat_exon2,8388,8484,8375,8471,forward,0.4918032786885247,RPASQLRGDQTGPKEQKKKVERETETDPGN,RPASQLRGDQTGPKEQKKKVERETETDPGN**,AGACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGA -OQ092467,rev_exon2,8389,8674,8376,8652,forward,0.4123815285339786,DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC,DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC*,GACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGAACGGATTCTTTGCGCTTATCTGGGACGACCTGCAGAGCCTGTGCCTCTTCAGCTACCGCCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAAGAGTGCTGTTAG -OQ092467,nef,8808,9417,8795,9416,forward,0.484764542936288,MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC,MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC*,ATGGGTGGCAAGTGGTCAAAATGTAGTCTGGTTGGATGGCCTGCTATAAGGGAAAGAATGAGACGAGCTGAGCCAGCTCCAGCAGCAGAAGGGGTGGGAGCAGCATCTCGAGACTTGGAAAAACATGGAGCACTCACAACTAGTAATACAGCAGCTAATAATGCTGCTTGTGCCTGGCTGGAAGCACAAGAGGAGGAAGAGGTGGGGTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGGAGCTATGGATCTTGGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCCAAAAAGACAAGAAATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTATACACCAGGGCCAGGGACTAGATATCCATTAACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATGAAGGAGAGAATAGCTGTTTGCTACACCCGATGAACCAGCATGGGGCAGATGACACAGAAAGAGAAGTATTAATGTGGAAGTTTGACAGCAGCCTAGCATTTCATCACAAGGCCCGAGAGCTGCATCCGGAGTACTACAAAAACTGCTGA +KX505501.1,env,0,1823,6223,8793,forward,0.7623480451210163,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,vif,0,1823,5040,5618,forward,0.7647696476964769,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,nef,0,1823,8795,9415,forward,0.764345579086969,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,tat_exon1,1,1749,5829,6044,forward,0.7680130480667754,MRKLQNGIDCIQCMQGLLHQAR,VSLVRPDLSLGALWLTREPTA*ASIKLALSASSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKGKPEELSRRRTRLAERAQQEARGGDW*VRRKFFD*RRLEGERWVRERQY*AGENWIDGKKFG*GQEEIKDIN*NI*YGQAES*NDSQLILAC*KHQKAVDKYWDSYNRLLRQDQKNLSLCIIQ*QSSIVYIKK*M*KTPRKP*TR*KKSKTKLGNKHSKPQLQEVAVRSATITL*CRIIRGKWYIRPCHQEL*MHG*K**RKRLSAQK*YPCFQHYQKEPPHKT*TPC*IQWGDIKQPCKC*KRPLMRKLQNGIDCIQCMQGLLHQAR*ENQGEVT*QELLVPFRNK*HG*QIIHLSQ*ERFIKDG*S*G*IK**ECIALSAFWT*DKDQRNLLETM*TGSIKP*EPNKPHRK*KIG*QKPCWSRMRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,GTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT +KX505501.1,gag,336,1823,789,2291,forward,0.3997973809613161,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,rev_exon1,1306,1749,5968,6045,forward,0.758082497212932,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,ATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT +KX505501.1,vpr,1599,1823,5558,5848,forward,0.763687959047407,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,vpu,1599,1823,6060,6308,forward,0.7672672672672673,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,pol,1627,1926,2084,5095,forward,0.7724330674761569,GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,IL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,ATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA +KX505501.1,tat_exon2,1746,1823,8375,8470,forward,0.7616257781032589,RCIRSTTRTADTELFTRDFPLGTFQ,RCIRSTTRTADTELFTRDFPLGTFQ*,AGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,rev_exon2,1747,1926,8376,8651,forward,0.7620186257236345,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA +MN691959,gag,639,2141,789,2291,forward,0.0801186943620179,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATCGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGAGAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGACACAGCAACCAGATCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAGTGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCYWYCTWTCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAAGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCWGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGAGTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MN691959,pol,1934,4945,2084,5095,forward,0.054722889368558514,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAGCTGAGACAACATCTGTTGAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAGAGCATTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGTATAGTAATATGGGGAAAGACTCCTAGATTTAAACTACCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCTTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGGTATGTTACTAACAAAGGAAGACAAAAGGTTGTCCCCCTAACTAACACAACAAATCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATCAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAATACTATTTTTAGATGGAATAGATAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATATTTTCTTTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN691959,vif,4890,5468,5040,5618,forward,0.09157509157509158,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAGGGGATGGTTTTATAGACATCACTATGAAAGAACTCATCCAAGAATAAGTTCAGAAGTATACATCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTACTTTGACTGTTTTTCAGACTCTGCTATAAGAAAGGCCTTATTAGGACATATAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAG +MN691959,vpr,5408,5698,5558,5848,forward,0.09157509157509158,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCAACAGAAGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MN691959,tat_exon1,5679,5894,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAG +MN691959,rev_exon1,5818,5898,5968,6045,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKFLYQSSK,MAGRSGDSDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN691959,vpu,5910,6155,6060,6308,forward,0.7333193453629878,MQPIQIAIVALVVAIIIAIVV,MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL*,ATGCAACCTATACAAATAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGATCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG +MN691959,env,6070,8655,6223,8793,forward,0.1405525502318391,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*,ATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATGCAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGGGGAATGCTACTAATACCAATAGTAGTAATACCAATAGTAGTAGCGGGGAAATGATGATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAAATAAGGTGCAGAAAGAATATGCATTCTTTTATAAACTTGATATAGTACCAATAGATAATGATACTACCAGCTATACGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGATGTAGTAATTAGATCTGCCAATTTCACAGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGCCACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACACTCCCATGCAGAATAAAACAATTTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGCGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAACAACAATGGGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATAACATGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTATAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAA +MN691959,tat_exon2,8237,8332,8375,8470,forward,0.6672629695885509,RPTSQTRGDPTGPKE,RPTSQTRGDPTGPKE*KKKVERETETDPFD**,AGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGA +MN691959,rev_exon2,8238,8513,8376,8651,forward,0.210025203024363,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE*,GACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAG +MN691959,nef,8657,9277,8795,9415,forward,0.06582796957284964,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA +MN692074,nef,0,4058,8795,9415,forward,0.7628009106462086,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,WKG*FGPRKDKISLICGSTTHKATSLIGRTTHQGRGPDFH*PLDGASS*YQLIQRR*KRPMQERTTACYTL*ACMGWRTRRKKC*CGSLTAA*HFITWPESCIRSTTRIADFELSTRDFPLGTFQGGVAWAGLGSGEPSDAAYKQLLFACTGSLWLDQI*AWELSG*LGNPLLKPQ*SLP*VL*VVCARLLCDSGN*RSLRPF*SVWKISSSGARTGT*KRKRNQRSSLDAGLGLLKRARQEARGGDW*VRQKF*LAEARRREMGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*G*GGN*RKLY*IQEQMIQY*KK*ICQEDGNQK**GELEVLSK*DSMIRYS*KSVDIKL*VQY**DLHLST*LEEIC*LRLVAL*IFPLVLLKLYQ*N*SQEWMAQKLNNGH*QKKK*KH**KFVQKWKRKGKFQKLGLKIHTILQYLP*RKKTVLNGEN**ISENLIRELKTSGKFN*EYHIPQG*ERKNQ*QYWMWGMHIFQFP*IKNLGNILHLPYPVETMRHQGLDISTMCFHRDGKDHQQYSKVA*QKF*SLLENKIQK*LSINTWMIYM*DLI*K*GSIE*K*RN*DNIC*DGDLPHQTKNIRKNPHSFGWVMNSILINGQYSL*CCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QK*YH*QKKQSWNWQKTGKF*KNQYMEYIMTHQKT**QKYRSRGKVNGHIKFIKSHLKI*KQENMQK*GVPTLMM*NN*QRQCKK*PQKA**YGERLLNLNYPYKKKHGKHGGQSIGKPPGFLSGSLSIPLP**NYGTS*RKNP**EQKPSM*MGQLTGRLN*EKQDMLLTEEDKKLSP*LTQQIRRLNYKQFI*LCRIRD*K*T**QTHNMH*,TGGAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAG +MN692074,env,2,4114,6223,8793,forward,0.76033143808071,MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,gag,789,2291,789,2291,forward,0.19470123431286457,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MN692074,pol,2084,4114,2084,5095,forward,0.5617851221088768,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,vif,3617,4114,5040,5618,forward,0.7631664499349805,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,vpr,3617,4114,5558,5848,forward,0.7629151983204618,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,vpu,3617,4114,6060,6308,forward,0.7634058115037564,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,tat_exon1,3823,4083,5829,6044,forward,0.7659115426105717,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC +MN692074,rev_exon1,3823,4083,5968,6045,forward,0.7610789980732178,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC +MN692074,tat_exon2,4080,4163,8375,8470,forward,0.769292994661058,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA +MN692074,rev_exon2,4081,4152,8376,8651,forward,0.7667894365645325,YPVASPQMLHISSCFLPVLGLSG,YPVASPQMLHISSCFLPVLGLSG*,TACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAG +MN692145,gag,775,2280,789,2291,forward,0.20784453738651432,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGAACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGGACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGATAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACACAGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAATGGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAAAACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MN692145,pol,2070,5084,2084,5095,forward,0.14843087362171337,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGGACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATACCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATCAAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACTGGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN692145,vif,5029,5607,5040,5618,forward,0.2608047690014903,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTATGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGACCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCATATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCCTAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAG +MN692145,vpr,5547,5837,5558,5848,forward,0.3566796368352788,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG +MN692145,tat_exon1,5818,6036,5829,6044,forward,0.28735632183908044,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA +MN692145,rev_exon1,5957,6037,5968,6045,forward,0.4274965800273598,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN692145,vpu,6049,6297,6060,6308,forward,0.520618556701031,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*,ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG +MN692145,env,6212,8782,6223,8793,forward,0.4766895145301081,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA +MN692145,tat_exon2,8364,8459,8375,8470,forward,0.3921568627450981,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +MN692145,rev_exon2,8365,8640,8376,8651,forward,0.29843322556577967,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG +MN692145,nef,8784,9386,8795,9415,forward,0.3966849799795139,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA +MN090335,gag,315,1664,789,2291,forward,0.596665989022159,MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ,MYTIEGGYCII**SKFF*SCLKGWL*LFQYLFTAS*CF*QARINCESF*FPACPYYMF*SIFFLSPWP*PNFLPSI*FSPAQY*RSRTHLSPSSLR*SKMAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ*,ATGTACACAATAGAGGGTGGCTACTGTATTATATAATGATCTAAGTTCTTCTGATCCTGTCTGAAGGGATGGTTGTAGCTGTTCCAATATCTGTTTACAGCCTCCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGTTCCCTGCTTGCCCATACTATATGTTTTAATCTATATTTTTTCTTTCCCCCTGGCCTTAACCGAATTTTCTCCCATCTATCTAATTCTCCCCCGCTCAATACTGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGTCAAAAATGGCGTACTCACCAGTCGCCGCCCCTCGCCTCTTGCCGTGCGCGCTTCAGCAAGCCACCCCACAAGATTTGAACACTATGCTAAACACAGTGGGTGGACACCAAGCAGCTATGCAAATGTTAAAAGAGGTCATCAATGAGGAAGCTGCAGAATGGGATAGATTACATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATTCTGGGACTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAGCAAGGGCCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTTTAAGAGCCGAGCAAGCTACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAATCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGCAACAGGTACAGCCAACATACTGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGCCTGTTAAATGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAGGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAA +MN090335,pol,1427,4468,2084,5095,forward,0.27887169154684477,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAGGACATAGATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAATATGAACAGGTACCCATAGAAATTAGCGGACACAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGCACTCTAAATTTTCCCATCAGCCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGACGGCCCAAAGGTTAAACAATGGCCATTAACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTGTTTGCCATAAAGAAAAAAGATGGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGAATTCTGGGAAATTCAATTAGGTATACCACATCCTGCAGGGCTAAAAAAGAAAAAATCAGTCACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTATAATGTGCTTCCACAAGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAGATCCTGGAGCCTTTTAGAAAGACAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAACATAGAACAAAAGTAGAGGAACTGAGGCAACATCTGATGAGGTGGGGATTTACCACACCAGACAAAAAGCACCAGAAAGAACCCCCATTCCTTTGGATGGGGTATGAACTCCATCCTAATAAATGGACAGTACAGCCTATAGTACTGCCAGAAAAGGAAAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTGAAGCAATTATGTAAGCTCCTTAGGGGAACCAAAGCATTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGATCCGGTACATGGAGCATATTATGACCCAGCAAAGGACTTAATAGCAGAACTACAGAAGCAGGGAGAAGGTCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCATACTAATGATGTAAAGCAATTAACAGAGGCAGTGCAAAAAATATCCACAGAAAGTATAGTAATATGGGGAAGGACTCCTAAATTTAGATTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGATTATTGGCAAGCCACCTGGATCCCTGAGTGGGAGTTTGTCAACACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAATAGGGATAATAAATCAGGAAAAGCAGGATATGTTACTGATAGAGGAAGACAAAAGGTTGTCACCATAAATGACACAACAAATCAGAAAACTGAATTACAAGCCATTCATCTAGCCTTGCAGGATTCGGGGCTAGAAGTAAACATAGTAACAGACTCACAGTATGCATTAGGGATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTAATAAAAAAGGAAAAGGTCTACCTGGCATGGGTGCCAGCCCACAAAGGAATTGGAGGAAATGAACAGGTAGATAAACTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGAAAAAGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAACAATGGCTAGTGATTTTAACCTACCACCTATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGGCAAGTAGACTGTAGTCCAGGTATATGGCAGCTAGATTGTACACATTTAGAAGAAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTGATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTATTTTAAAACTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCCGCAATTTCACCAGTAATACAGTGAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGTATTCCCTACAATCCCCAGAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGATACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCCAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN090335,vif,4413,4991,5040,5618,forward,0.3566796368352788,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAAAAATGGGCTTATAGACACCATTACGAAACCACTCATCCAAGAATAAGTTCAGAAGTACATATCCCACTAGGGGATGATAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAGAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAACAGCAGTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG +MN090335,vpr,4931,5221,5558,5848,forward,0.3808935556928146,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAGACCTAGGACAATATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATGGAGCCAGTAGATCATAG +MN090335,tat_exon1,5202,5417,5829,6044,forward,0.40192926045016075,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAG +MN090335,rev_exon1,5341,5421,5968,6045,forward,0.524971623155505,MAGRSGDRDEDLLKTVRLIKFLYQSSK,MAGRSGDRDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAG +MN090335,vpu,5433,5681,6060,6308,forward,0.5244381020335356,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL*,ATGCAATCTTTAGAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTAGGCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAAAATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG +MN090335,env,5596,8157,6223,8793,forward,0.5152420275849952,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*,ATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTGGACCAGATGCATGAGGATATAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAGAAATGATACTGTAGGAAATCAAACAAATCTCACTGAAACTAATACAATACAGGGAAGAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAACATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAGGGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTGGTTTTGCAATTCTAAAGTGTAAGGATGAGATGTTCAATGGAACAGGACCATGTAAGAATGTCAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTGTCAACTCAACTACTGTTAAATGGTAGCCTAGCAGAAAAAGAGATAGTACTTAGATCTGAAAATTTCACAGACAATGGTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAGGGAGAGCAATTTATGCAACAGGGCAGATAATAGGAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGGAATGACACTTTAAGCAAAATAGTTGAAAAATTAAGGGAAAAATTTGGAAAAGATAAAACAATAATCTTTAATCAATCATCAGGAGGGGACATGGAAATTGAAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGGAGTGTTAATGGAACTAGCATAAACGGAACTAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATAAACAGGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCTATCAGTGGGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATGGTGGTACAAATAATAGTACAGAGGAGACGGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAAGGCACAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAGCGTTAGGAGCTATGTTCCTCGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCACTGACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGCAATAAATCTTACGATACCATCTGGGATAACATGACCTGGATGCAGTGGGACAGAGAAATTCAAAATTACACAGGGAAAATATACAACTTACTTGAGGAATCGCAAATCCAACAGGAAAAGAATGAAAAGGAATTATTAGAACTAGATCAATGGGCAAATTTGTGGAATTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAGGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAGGGAACAGATAGGGTTATAGAGGTAGGACAAAGAATTGGCAGAGCTTTTCTCCACATACCTAGAAGGATAAGACAGGGATTAGAAAGGGCTTTGCAATAA +MN090335,tat_exon2,7739,7834,8375,8470,forward,0.6842105263157894,RPSSQPRGDQTGPKE,RPSSQPRGDQTGPKE*KKKVERETEADPED**,AGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGA +MN090335,rev_exon2,7740,8015,8376,8651,forward,0.4267425320056898,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE*,GACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAG +MN090335,nef,8159,8812,8795,9415,forward,0.4891015417331206,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAGGTTGTATGGCTGGATGGCCTACTGTAAGGGAAAGAATGGAAAGAATTGATCCAAGGCCTGCTGCAAGGAGGGAACAAGCTGAGCCAGCAGCAGCTGGGGTAGGAGCAGCATCTCGAGACTTGGAAAAATATGGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAAGTAGGCTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTGGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA +MN090376,gag,522,1589,789,2291,forward,0.6828741441147701,MYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP,MHTIEDCYCIK**FKFL*SCLKCWL*LSQYLSTAF*CF*QARINCESFQFPACPYYMF*LISFLSPWP*PNFLPFV*FSPA*YRRSRTHLSPSSLR*SKRRTHRSPPLASCCARFSKPSPIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP*SQ*,ATGCACACAATAGAGGACTGCTACTGTATTAAATAATGATTTAAGTTCCTCTGATCCTGTCTGAAGTGCTGGTTGTAGCTGTCCCAGTATTTGTCTACAGCCTTCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCCAGTTCCCTGCTTGCCCATACTATATGTTTTAACTTATATCTTTTCTTTCCCCCTGGCCTTAACCGAATTTTCTCCCATTTGTCTAATTCTCCCCCGCTTAATACCGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGTCAAAAAGGCGTACTCACCGTTCGCCGCCCCTCGCCTCTTGCTGTGCGCGCTTCAGCAAGCCGAGTCCGATAATTCTGGGATTAAATAAAATAGTAAGAATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAACCCAGATTGTAAGACCATTTTAAAAGCATTGGGTCCAGCAGCTACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAACTCAGCTTCCGTGATGATGCAGAAAGGCAATTTTAGGAGCCAAAGAAAGATGGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCAAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAGAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAA +MN090376,pol,1382,4393,2084,5095,forward,0.23966680468616797,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAGAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTGTTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGCTTTATCAAAGTAAAACAGTATGATCAGATATCAGTAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAATATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAGGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAGTTAGTAGATTTTAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCCTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTACTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAGTAGAGGAACTGAGACAACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAACTGCCAGAGAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAGTTGAATTGGGCAAGTCAGATTTATCCAGGGATTAAAGTAAGGCAGTTATGTAAACTACTTAGAGGAGCCAAGGCGCTGACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATCCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAACTTGAAAACAGGAAAATATGCAAGAACAAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATTCAAAAAGAAACATGGGAATCATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAGACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACAAAATCAGGAAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAAGTTATCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGATAAAAGCGAATCAGAGTTAGTCAATCAAATAATAGAGCAATTAATACAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGGGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGAAAGGTACTATTTTTGGATGGAATAGATAAAGCCCAAGATGAGCATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACATACCACCTGTAGTAGCAAAAGAAATAGTAGCCTGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCCCCAACTTCACCAGTAATGCAGTTAAGGCCGCCTGTTGGTGGGCAGGGGTCAAACAAGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTCGTAGAATCTATGAATAAACAATTAAAACAAATTATAGGACAGGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAGGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTGGTAATACAAGATAATAGTGACATAAAAGTAGTACCAAGAAGAAAAGCAAAAATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN090376,vif,4338,4919,5040,5618,forward,0.42479043044174425,MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAGCATGTGGAAAAGCTTAGTAAAATACCATATACATAATTCAGGGAAGGCTAGGGGATGGTGTTATAGACATCACTATGAAAGCAGACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGAGGAGAGGCTAGACTAGTAGTGACAACATATTGGGGACTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTATTTTAATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAATAAGGTAGGATCTCTGCAGTACTTGGCACTAATAGCATTAATACCACCAAAAAGGAAAAAGCCACCTTTGCCTAGTGTGAGGAAACTGACAGAGGATAGATGGAAAGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG +MN090376,vpr,4859,5149,5558,5848,forward,0.36116422349691957,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*,ATGGAAAGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCTTGGCTTCATGGCCTAGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAATTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MN090376,tat_exon1,5130,5345,5829,6044,forward,0.46628407460545196,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAGGACTGCGTGCACCAGTTGCTATTGTAAAAAGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAG +MN090376,rev_exon1,5269,5349,5968,6045,forward,0.5763097949886105,MAGRSGDSDEELLRIAGTIKFLYQSSK,MAGRSGDSDEELLRIAGTIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAGTAAG +MN090376,vpu,5361,5630,6060,6308,forward,0.5680096940321115,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL*,ATGCAATCTTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTCGTTTGGTCTATAGTACTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAA +MN090376,env,5524,8109,6223,8793,forward,0.49863720871464445,MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGATATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAATGCAGAGGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAGCCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACACAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTAACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTAACATCAATAGCACTAATATAAACAATACCAATAGTATAGAAAGAGAAATGACAAACTGCTCTTTTAATGTCACCACAGTCATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAAACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGCTATAGGTTGATAAATTGTAACTCCTCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAATTTCAATGGAACAGGACTATGTAAAAATGTTAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGAGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAACACAGAAGTAAATATTATCACACTCCCATGCAAGATAAGGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACATTTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTACATTTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGAAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA +MN090376,tat_exon2,7691,7783,8375,8470,forward,0.4464285714285715,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAG +MN090376,rev_exon2,7692,7967,8376,8651,forward,0.4267425320056898,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG +MN090376,nef,8111,8734,8795,9415,forward,0.5036770338593534,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACATCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACTCAGAGAGAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA +MK115581.1,gag,680,2179,789,2291,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115581.1,pol,1972,4983,2084,5095,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115581.1,vif,4928,5506,5040,5618,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115581.1,vpr,5446,5736,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115581.1,tat_exon1,5717,5935,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115581.1,rev_exon1,5856,5933,5968,6045,forward,0.4267425320056898,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115581.1,vpu,5948,6193,6060,6308,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115581.1,env,6111,8651,6223,8793,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115581.1,tat_exon2,8233,8328,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115581.1,rev_exon2,8234,8509,8376,8651,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115581.1,nef,8653,9267,8795,9415,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115690.1,gag,777,2285,789,2291,forward,0.24076694150363465,MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGACAAGTGGGAAAAAATTCGGTTGAGGCCAGGGGGAAAGAAAAAATATAGATTAAAGCATATCGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATAATGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTGTATAATACAGTAGCAACCCTCTATTGTGTACATCAAAGGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGGCGCAGGAAACAGCAGTCAGACCAGCACCAGCCAAAATTACCCTATAGTACAGAACATTCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTCTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTACATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACTAATAATCCACCTATCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCCACCAGCATTCTAGACATAAGACAAGGACCAAAGGAGCCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTAGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGTCCAGCAGCTACACTAGAGGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGTCATAAAGCAAGAGTTTTAGCGGAAGCAATGAGCCAAGCAACAAATTCAGCTGCCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAAAGTGTTAAGTGTTTTAATTGCGGCAAAGATGGGCACATAGCAAAAAATTGCAGGGCCCCTAGAAGAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTCCAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGAAGATAGACCAGGACCTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MK115690.1,pol,2078,5089,2084,5095,forward,0.185747174550021,FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGAAGATAGACCAGGACCTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGGTAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGACATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAAATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGCACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATAGGGCCTGAGAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGACTTCAGAGAACTAAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCCTATTTTTCAGTTCCCTTAGACAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAACCTTATAGAAAACAAAATCCAAACATAGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACCTAGAAATAGGGCAGCATAGAATAAAAATAGAAGAACTGAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGGTATGAACTCCATCCTGACAAGTGGACAGTACAGCCTATAGCGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAACTGGGCAAGTCAGATCTACCCAGGAATTAAAGTAAGGCAATTATGTAAACTACTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAAAAGAAGCAGAGCTAGAATTAGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGAGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTGACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTGATATGGGGAAAGACTCCTAAATTTAGACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAAACTAAATCAGGAAAAGCAGGATATGTTACTAATAGAGGAAGACAAAAAGTTATCCCCCTAACTGACACAACAAATCAGAAGACTGAGTTACATGCAATTTATCTAGCTTTGCAAGATTCGGGATTAGAAGTAAATATAGTAACAGACTCACAGTATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTGTTTTTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTCATTCCAGCAGAGACAGGGCAGGAAGCAGCATACTTTATTTTAAAATTAGCAGGACGATGGCCAGTAGCAACAATACATACAGACAATGGCAGCAATTTCACCAGTGCTACAGTTAAGGCCGCCTGCTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAACAATGAATTGAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACGTAATAGCAACAGACTTACAAACTAAAGAACTACAAAAACAAATTACAAAAATTCAACATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGAAATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115690.1,vif,5034,5612,5040,5618,forward,0.39766435115272314,MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH,MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAAGATGGCACAGTTTAGTAAAACACCATATATATATTTCAGGGAAAGCTAGAGGATGGGTTTATAAACATCACTATGAAAACACTCATCCAAGAATAAGTTCAAAAGTATACATCCCACTAGGGGAAGCTAGACTGGCAGTAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCACTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAAGGAATATAGCACACAAGTAGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGTCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTTTACAGTACTTGGCACTAACAGCATTAGTAACACCAAAAAAGACAAAGCCACCTTTGCCTAGTATTACGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAGAACCAAGGGCCACCGAGGGAACCATACAATGAATGGGCACTAG +MK115690.1,vpr,5552,5842,5558,5848,forward,0.37688442211055273,MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS,MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS*,ATGGAACAAGCCCCAGAGAACCAAGGGCCACCGAGGGAACCATACAATGAATGGGCACTAGAGCTTTTAGAGGAGCTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACACATCTATGAGACTTATGGGGATACTTGGACAGGAGTGGAAGCCTTAATAAGAAGTCTGCAACAACTGCTGTTCATTCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGAATTACTCCACAGAGGAGAACAAGAAATGGAGCCAGTAGATCCTAA +MK115690.1,tat_exon1,5823,6038,5829,6044,forward,0.40192926045016075,MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ,MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ,ATGGAGCCAGTAGATCCTAATCTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCACTTGCTATTGTAAACAGTGTTGCTATCATTGCCAAGTTTGTTTCATAACCAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAG +MK115690.1,rev_exon1,5962,6042,5968,6045,forward,0.524971623155505,MAGRSGDNDEDLLKTVRFIKLLYQSSK,MAGRSGDNDEDLLKTVRFIKLLYQSSK,ATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAGTAAG +MK115690.1,vpu,6054,6299,6060,6308,forward,0.48542752364408415,MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL,MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL*,ATGCAATCTTTAGCAATATTAGCAATAGTAGCATTAGTAGTAGCAGCCATAATAGCAATAGTTGTGTGGACCATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGATAGTGGCAATGAGAGTGAAGGGGATCATGAAGAATTATCAGCACTTATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAG +MK115690.1,env,6217,8799,6223,8793,forward,0.49751604598034604,MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ,MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ*,ATGAGAGTGAAGGGGATCATGAAGAATTATCAGCACTTATGGAGATGGGGCATCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTTACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAAACACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCTACAGACCCCAACCCACAAGAAATAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTACATTGCACTAAGTTGGAGATTAATAGCACTAAGAAGACTAATAGCACTAATAATGGTACTAACATCAATGCCACTGATGATAGTTGGGGGGAAATGAAAAACTGCTCTTTCAATACCACTGCAAGCATAAGAGATAAGGTACAGAGAGAATTTGCGCTTTTTTATAAACTTGATATAGTACCAATAGATAATGATGATATCAACTATAGGTTAATAAGTTGTAACACCTCAGTCCTTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAGAGATAAAAATTTCAATGGAACAGGACAATGTAAAAATGTCAGCACAGTGCAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTCAATGGCAGTCTAGCAGAAGAAGAGGTAGTAATTAAATCTGAAAATATCACAGACAATACTAAAACTATAATAGTACAGCTGAATGCATCTGTAGCAATTGTTTGTACAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGGCCAGGGAGAGCGTTTTATGCAGCAGGAGATATAATAGGAGACATAAGACGAGCACACTGTATCCTTAACAAAACAACATGGGATAACACAATAGAACAGGTAGCTAAAAAATTAAGAGAACAATTTGAGAATAAGACAATAGTCTTTAGTGAATCCTCGGGAGGGGACCCAGAAATTACAATGATTAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAGTACAACTGTTTAATAGTACTTGGCATAATAATGGGAGTAGTACTACAGGGTCAAGTAGCAGTGAAGGCAATATCACACTCCCATGCAAAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACCAATTAGCTGCGAGTCAAATATTACAGGGTTGCTACTAACAAGAGATGGTGGGAATGACGCTAACGGGAACAACACCGAGACCTTCAGACCTGGAGGAGGAAATATGAGGGACAATTGGCGAAGTGAATTATATAGATACAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAGGGCACAGAGAAGAGTGGTACAGAGAGAAAAAAGAGCAGTGGGTCTCGGAGCCTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGCTTTGGGGTTGCTCTGGAAAACTCATCTGCAACACTGCTGTGCCTTGGAATACTAGTTGGAGTAACAAATCTCTGGATGATATTTGGCATAACATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAAACATAATATACAGCTTAATTGAGGCATCGCAAACCCAGCAAGAAAAGAATGAACAAGAATTACTAGAATTAGACAAATGGGCAAGTCTGTGGAATTGGTTTAGCATATCAAACTGGCTGTGGTACATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTACTATACTTTCTATAGTGAATAGAGTTAGGAAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAGTGGATGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAACCTGTGCCTCTTCCTCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATACTGGTGGAACCTTCTGCAGTATTGGAGGCGGGAACTAAAGAATAGTGCTGTTAGCTTGCTTAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGAGTTATAGAAGGATTGCGCAGAGCTTTTAGAGCTATTATCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGAGCTTTGCAATAA +MK115690.1,tat_exon2,8381,8473,8375,8470,forward,0.4918032786885247,RPTSQPRGDPTGPKEPETKVESKTETDPLT,RPTSQPRGDPTGPKEPETKVESKTETDPLT*,AGACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAG +MK115690.1,rev_exon2,8382,8657,8376,8651,forward,0.42982806877249113,DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE,DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE*,GACCCACCTCCCAGCCCAGAGGGGACCCGACAGGCCCGAAGGAACCGGAGACGAAGGTGGAGAGCAAGACAGAGACAGATCCACTCACTTAGTGGATGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAACCTGTGCCTCTTCCTCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATACTGGTGGAACCTTCTGCAGTATTGGAGGCGGGAACTAAAGAATAG +MK115690.1,nef,8801,9424,8795,9415,forward,0.459649710885779,MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN,MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN*NC*,ATGGGTGGTAAATGGTCAAAATGTAGTATAGTTGGATGGCCTACTGTAAGGGAAAGAATAAGACGAGCAGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAAGCATGGAGCAATCACAAGTAGCAATGCTAACAATGCTGATTGTACCTGGCTGGAAGCCCAAAAAGAAGAGGAGGAGGTAGGCTTTCCAGTCAGGCCTCAGGTACCCTTAAGACCAATGACTTACAAGGCAGCCTTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGATAATTTACTCCCAAAAAAGACAAGATATTCTTGATCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACTAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGAGAGGGTAGAAGAGGAGAATAAAAGAGAGAACCGCTGCTTGTTACACCCTATGAGCCAGCATGGGATGGATGACCCAGAGAAAGAAGTGCTACAGTGGAGGTTTGACAGCCGCCTAGCCTTTCACCACGTAGCCAGAGAGCTGCATCCGGAGTACTATAAGAACTAGAACTGCTGA +MK115571.1,gag,579,2078,789,2291,forward,0.3014827756125966,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115571.1,pol,1871,4882,2084,5095,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAAATAGGGGGGCAATTTAAAGAAGCTTTCTTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTAAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115571.1,vif,4827,5405,5040,5618,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115571.1,vpr,5345,5635,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115571.1,tat_exon1,5616,5831,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG +MK115571.1,rev_exon1,5755,5835,5968,6045,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115571.1,vpu,5847,6092,6060,6308,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115571.1,env,6010,8550,6223,8793,forward,0.4585964351370794,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAGATAAGATGCAGAAAGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAAATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGGATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTTAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115571.1,tat_exon2,8132,8227,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115571.1,rev_exon2,8133,8408,8376,8651,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115571.1,nef,8552,9166,8795,9415,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAATGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGATACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTGCACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115514.1,gag,584,2083,789,2291,forward,0.3014827756125966,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115514.1,pol,1876,4887,2084,5095,forward,0.19298018391400085,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGCTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAATACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115514.1,vif,4832,5410,5040,5618,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGAGATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115514.1,vpr,5350,5640,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115514.1,tat_exon1,5621,5839,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115514.1,rev_exon1,5760,5837,5968,6045,forward,0.4267425320056898,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115514.1,vpu,5852,6097,6060,6308,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115514.1,env,6015,8555,6223,8793,forward,0.46021436825118545,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATATTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAGTCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTAAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115514.1,tat_exon2,8137,8232,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115514.1,rev_exon2,8138,8413,8376,8651,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115514.1,nef,8557,9171,8795,9415,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACGGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115488.1,gag,707,2206,789,2291,forward,0.3014827756125966,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115488.1,pol,1999,5010,2084,5095,forward,0.19298018391400085,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGCTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAATACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115488.1,vif,4955,5533,5040,5618,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGAGATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115488.1,vpr,5473,5763,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115488.1,tat_exon1,5744,5962,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115488.1,rev_exon1,5883,5960,5968,6045,forward,0.4267425320056898,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115488.1,vpu,5975,6220,6060,6308,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115488.1,env,6138,8678,6223,8793,forward,0.46021436825118545,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATATTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAGTCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTAAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115488.1,tat_exon2,8260,8355,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115488.1,rev_exon2,8261,8536,8376,8651,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115488.1,nef,8680,9294,8795,9415,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACGGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115030.1,gag,176,1684,789,2291,forward,0.27304152847199525,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATGGGAAAAAATTTACCTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGTGTACATCAAAGGATAAATGTAAAAGACACCAAGGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATGGTACATCAACCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAGGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAGGGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATACTCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGGGATTATGTAGACCGGTTCTATAAAACTCTAAGGGCTGAGCAAGCGTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAATCAGCCTCCATAATGGTGCAGGGAGGCAATTTTAGGAACCAAAGAAAGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA +MK115030.1,pol,1477,4488,2084,5095,forward,0.26443159013103534,FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCAGTCAACATAATTGGAAGAAATCTGTTGACCCAGCTTGGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATGGAAAAGGAAGGGAAAATTACAAAAATTGGGCCTGAGAATCCATATAATACTCCAGTGTTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTGGGAAGTTCAACTAGGAATACCACATCCCGCAGGGTTAAAAAGGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGGAGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGGGGTGGGGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAGTTGAATTGGGCAAGCCAGATCTATCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGGGGAGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCTATACAAAAGGAAACATGGGAAATGTGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAATTAGGAAAAGCAGGGTATGTTACGGACAGAGGAAGACAAAAGGTTGTCTCCCTAATGGACACAACAAATCAGAGGACTGAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAGGGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAGGAAAAGATTTACCTGGCATGGGTCCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTAATGGAATCAGAAAAATACTATTTCTGGATGGAATAGATAAGGCCCAAGAAGAACATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115030.1,vif,4433,5011,5040,5618,forward,0.3903081914030819,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGGGGAAGCAAGATTGGTAATAAAAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAG +MK115030.1,vpr,4951,5241,5558,5848,forward,0.3566796368352788,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGACATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115030.1,tat_exon1,5222,5440,5829,6044,forward,0.48954161103693805,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA +MK115030.1,rev_exon1,5361,5438,5968,6045,forward,0.4886988393402566,MAGRSGDSDEELLTAVRIIKRLYQSS,MAGRSGDSDEELLTAVRIIKRLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT +MK115030.1,vpu,5453,5698,6060,6308,forward,0.5682727709300466,MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM,MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM*,ATGCATATCTTAGAAATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGGGACCAGGAGGAATTATCAGCAATTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG +MK115030.1,env,5616,8216,6223,8793,forward,0.5091484869809996,MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGAAAGTGACGGGGACCAGGAGGAATTATCAGCAATTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAGAAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAAATCGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAGGTAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATGGAACAGACATAATAGGGGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAATAATACTTGGAATGGTACTGATAATTGGAATGGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGAAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAATGGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAACCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAAGCAGTGGGAAAAGGAAATTGACAATTACACAGACATAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTAAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +MK115030.1,tat_exon2,7798,7890,8375,8470,forward,0.4918032786885247,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG +MK115030.1,rev_exon2,7799,8074,8376,8651,forward,0.40871934604904625,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG +MK115030.1,nef,8218,8859,8795,9415,forward,0.5432971135257649,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTGCCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATACTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA +MK115498.1,gag,663,2162,789,2291,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115498.1,pol,1955,4966,2084,5095,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115498.1,vif,4911,5489,5040,5618,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115498.1,vpr,5429,5719,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115498.1,tat_exon1,5700,5915,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG +MK115498.1,rev_exon1,5839,5919,5968,6045,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115498.1,vpu,5931,6176,6060,6308,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115498.1,env,6094,8634,6223,8793,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115498.1,tat_exon2,8216,8311,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115498.1,rev_exon2,8217,8492,8376,8651,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115498.1,nef,8636,9250,8795,9415,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115211.1,gag,250,1752,789,2291,forward,0.25132972351334526,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP*SQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGACAAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAGATATAAGTTAAAACATATAGTATGGGCAAGCAGGGAACTGGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAGGAACTTAAATCATTATTTAATACAGTAGCAGTCCTCTATTGTGTGCATCAAAAGATAGAGATAAAAGACACCAAGGAAGCTTTAGACAAGATAGAGGAAGAACAAAACAAAAGTAAGAAAAAGACACAGCAAGCAGCAGCTGACACAGGACATAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATGCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTGAAAGTAGTAGAAGAGAAGGCATTTAGCCCAGAAGTAATACCCATGTTTTCAGCCTTATCAGAAGGAGCCACCCCACAAGATTTGAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACTATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCGATTGCACCAGGCCAGATGAGAGAGCCGAGGGGAAGTGACATAGCAGGAACCACCAGTACCCTTCAGGAGCAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTACAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAACCCAGATTGTAAAACCATTTTAAAAGCATTGGGTCCAGCAGCTACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAACTCAAATGCCGTGATGATGCAGAAAGGCAATTTTAGGAGCCAAAGAAAGATGGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCAAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAACTTTCCTCAAAGCAGGACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAA +MK115211.1,pol,1545,4556,2084,5095,forward,0.2540106951871657,FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAACTTTCCTCAAAGCAGGACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTCTGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTGTTAGAAGACATGAATTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAAACAGTATGATCAGATATCAGTAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAATATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAGGAAATGGAAAAGGAAGGGAAAATTTCAAGAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCAATAAAGAAAAAAGACAGTACTAAATGGAGAAAGTTAGTAGATTTTAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCCTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTACTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCTGACATAGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAGTAGAGGAACTGAGACAACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAACTGCCAGAGAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAGTTGAATTGGGCAAGTCAGATTTATCCAGGGATTAAAGTAAGGCAGTTATGTAAACTACTTAGAGGAGCCAAGGCGCTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATCCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAACTTGAAAACAGGAAAATATGCAAGAACAAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATTCAAAAAGAAACATGGGAATCATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACAAAATCAGGAAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAAGTTATTTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGATAAAAGCGAATCAGAGTTAGTCAATCAAATAATAGAGCAATTAATACAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGGGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGAAAGGTACTATTTTTGGATGGAATAGATAAAGCCCAAGAAGATCATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACCTACCACCTGTAATAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCTAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCCCCAACTTCACCAGTAATGCAGTTAAGGCCGCCTGTTGGTGGGCAGGGGTCAAACAAGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTTGTAGAATCTATGAATAAACAATTAAAACAAATTATAGGGCAGGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAGGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTGGTAATACAAGATAATAGTGACATAAAAGTAGTACCAAGAAGAAAAGTAAAAATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAA +MK115211.1,vif,4501,5082,5040,5618,forward,0.40472673559822736,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAACATGTGGAAAAGCTTAGTAAAATACCATATACATAATTCAGGGAAGGCTAGGGGATGGTGTTATAGACATCACTATGAAAGCAGACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGAGGAGAGGCTAGACTAGTAGTGACAACATATTGGGGCCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTATTTTAATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAATAAGGTAGGATCTCTGCAGTACTTGGCACTAATAGCATTAATACCACCAAAAAGGAGAAAGCCACCTTTGCCTAGTGTGAGGAAACTGACAGAGGATAGATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG +MK115211.1,vpr,5022,5312,5558,5848,forward,0.3808935556928146,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*,ATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCATGGCTTCACGGCCTAGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAACTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGGGCAAGAAATGGAGCCAGTAGATCCTAG +MK115211.1,tat_exon1,5293,5511,5829,6044,forward,0.4691531785127845,MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAAGACTGCTTGCACCAGTTGCTATTGTAAAAGGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGA +MK115211.1,rev_exon1,5432,5512,5968,6045,forward,0.564475664826894,MAGRSGDSDEELLRITRTIKFLYQNSE,MAGRSGDSDEELLRITRTIKFLYQNSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGAG +MK115211.1,vpu,5524,5793,6060,6308,forward,0.5776066350710902,MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL,MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL*,ATGCAATCTTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTCGTTTGGTCTATAGTATTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAA +MK115211.1,env,5687,8197,6223,8793,forward,0.6638103647692366,MHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGRSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDPEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTTINNTSSIEEGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSATITQACPKVSFEPIPIH*VQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRKAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGAGGTCAATGACCTGTAATGCAGAAGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACCCAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTGACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTGAGTTGAAGAATAGCACTACTATAAACAATACCAGTAGTATAGAAGAAGGAGAAATGAAAAACTGTTCTTTTAATGCCACCACAGCAATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAGACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGATATAGGTTGATAAATTGTAACTCCGCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTAGGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAAAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGAAAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGAGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAATACAGAAGTAAATATTATCACACTCCCATGCAAGATAAAGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACACTTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTACATTTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGTAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGACTTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA +MK115211.1,tat_exon2,7779,7871,8375,8470,forward,0.4464285714285715,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAG +MK115211.1,rev_exon2,7780,8055,8376,8651,forward,0.4267425320056898,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG +MK115211.1,nef,8199,8822,8795,9415,forward,0.5093153589821267,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACACCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTGCCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACCCAGATAAAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA +MK115158.1,gag,316,1818,234,1730,forward,0.38499312512276596,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP*SQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGACAAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAACAATATAAGTTAAAACATATAGTATGGGCAAGCAGGGAACTGGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAGGAACTTAAATCATTATTTAATACAGTAGCAGTCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGACAAGATAGAGGAAGAACAAAACAAAAGTAAGAAAAAGACACAGCAAGCAGCAGCTGACCCAGGAAATAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATGCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTGAAAGTAGTAGAAGAGAAGGCTTTTAGCCCAGAAGTAATACCCATGTTTTCAGCCTTATCAGAAGGAGCCACCCCACAAGATTTGAACACGATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACTATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCGATTGCACCAGGCCAGATGAGAGAACCGAGGGGAAGTGACATAGCAGGAACCACCAGTACCCTTCAGGAGCAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTACAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAACCCAGATTGTAAGACCATTTTAAAAGCATTAGGTCCAGCAGCTACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAACTCAGCTTCCGTGATGATGCAGAAAGGCAATTTTAGGAGCCAAAGAAAGATGGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCAAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTATGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAA +MK115158.1,pol,1611,4622,1526,4534,forward,0.30843043180260443,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED,FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAACTTTCCTCAAAGCAGAACAGAACCAACAGCCCCACCAGAGGAGAGCTTCAGTTTTGGGGAAAAGACAACAACTCCTTCTCAGAAGCAGGAGCCGATAGACCAGGAACTATACCCTATGTCTTCCCTCAAATCACTCTTTGGCAACGACCCTTAGTCACAGTAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTGTTAGAAGAAATGAGTCTACCAGGAAGATGGAAGCCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAAACAGTATGATCAGATATCAGTAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAATATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAGGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCAATAAAGAAAAAAGACAGTACTAAATGGAGAAAGTTAGTAGATTTTAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCCTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTACTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAGAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATGGTTATATATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAGTAGAGGAACTGAGACAACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAACTGCCAGAGAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAGTTGAATTGGGCAAGTCAGATTTATCCAGGGATTAAAGTAAGGCAGTTATGTAAACTACTTAGAGGAGCCAAGGCGCTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATCCTAAAAGAACCAGTGCATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAACTTGAAAACAGGAAAATATGCAAGAACAAGGGGTGCTCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATTCAAAAAGAAACATGGGAATCATGGTGGACAGAATATTGGCAAGCCACTTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACAAAATCAGGAAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAAGTTATCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGATAAAAGCGAATCAGAGTTAGTCAATCAAATAATAGAGCAATTAATACAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGGGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGAAAGGTACTATTTTTGGATGGAATAGATAAGGCCCAAGAAGATCATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACATACCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCTAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCCCCAACTTCACCAGTAATGCAGTTAAGGCCGCCTGTTGGTGGGCAGGGGTCAAACAAGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTTGTAGAATCTATGAATAAACAATTAAAACAAATTATAGGACAGGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAACTTCTTTGGAAAGGTGAGGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTACCAAGAAGAAAAGCAAAAATTATTAGGGATTATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAA +MK115158.1,vif,4567,5148,4479,5060,forward,0.48399487836107546,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH,MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGGTTGTGTGGCAAGTAGACAGGATGAGGATTAACATGTGGAAAAGTTTAGTAAAATACCATATACATAATTCAGGGAAGGCTAGGGGATGGTGTTATAGACATCACTATGAAAGCAGACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGAGGAGAGGCTAGACTAGTAGTGACAACATATTGGGGCCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTATTTTAATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAATAAGGTAGGATCTCTGCAGTACTTGGCACTAATAGCATTAATACCACCAAAAAGGAGAAAGCCACCTTTGCCTAGTGTGAGGAAACGGACAGAGGATAGATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG +MK115158.1,vpr,5088,5378,5000,5290,forward,0.43053960964408733,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS*,ATGGAACGAGCCCCAGAGGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAACTTTTAGAAGAGCTTAAAAGAGAAGCTGTTAGGCACTTTCCTAGGGCATGGCTTCACGGCCTGGGACAACATATCTATGAAACTTATGGAGATACTTGGGCAGGAGTGGAAGCTCTAATAAGAATTCTGCAACAACTGGTGTTTATTCATTTCAGAATTGGATGTCAGCACAGCAGGATAGGCATTCTTACCCATAGAAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115158.1,tat_exon1,5359,5577,5271,5486,forward,0.4464285714285715,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAGGACTGCGTGCACCAGTTGCTATTGTAAAAAGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAAGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGA +MK115158.1,rev_exon1,5498,5578,5410,5487,forward,0.5622384937238494,MAGRSGDSDEELLKITRTIKFLYQNSE,MAGRSGDSDEELLKITRTIKFLYQNSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAAGATAACCAGAACCATCAAGTTTCTTTATCAAAACAGTGAG +MK115158.1,vpu,5590,5859,5502,5747,forward,0.5374618963580942,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWDVNDL,MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWDVNDL*,ATGCAATCCTTAGAAATATTAGCAATAGTAGCATTAGTAGTAGCATTTATAATAGCAATAGTTGTTTGGTCTATAGTACTCATAGAATATAGGAAAATAAGAAGACAAAAGAGAATAGACAGGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAA +MK115158.1,env,5753,8314,5665,8211,forward,0.5078662118966413,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGMSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCENVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL,MRVKGTKKNWQPSWRWGTMLIWGWATMLLGMSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCENVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGACCAAGAAGAATTGGCAGCCCTCGTGGAGATGGGGAACCATGCTCATTTGGGGATGGGCCACCATGCTCCTTGGGATGTCAATGACCTGTAATGCAGAAGACTCGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCCAAAGCATATGACACAGAGGTACACAATGTCTGGGCCACACATGCTTGTGTACCCACAGACCCCAACCCACAAGAAGTAGAATTAAATGTGACAGAAAATTTTAATGCATGGAAAAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAACTGCACTGAGTTGAAGAATAGCACTGGAGAAATGAAAAACTGTTCTTTTAATGCCACCACAGCAATAAGAGATAAGGTGCAAAAACAATATGCACTTTTTTATAGACTTGATGTAGTACAAATTAAGGATGATAATACCAGCTATAATACCAGATATAGGTTGATAAATTGTAACTCCTCAACCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAATTTCAATGGAACAGGACTATGTGAAAATGTTAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTATCAACTCAACTGTTGTTAAATGGCAGTCTAGCAGAAGGAGATGTAGTAATTAGATCTAAAAATTTCTCTAACAGTGCTCAAACCATAATAGTACAATTAAACGAAACTGTAGAAATTAATTGTACAAGACCCAACAATAATACAAGAAAAAGTATACATATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGATATAAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGAGACTTTAAAAAAGATAGCTGATAAATTAAGGGAACAATTTAAAAGGGAGACAATAGTCTTTAACCAATCCTCAGGAGGGGACCCAGAGATTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACACAACTGTTTAATAGTACTTGGAATAGTACTACAGGAGTAAATGGTACAGGAGCAAATAATACAGAAGTAAATATTATCACACTCCCATGCAAGATAAAGCAAATTGTAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAGTTGTTCATCAAATATTACAGGGCTACTACTACTAAGAGATGGTGGTAATAGCAATGACACGGATAACACGACTGAAATCTTCAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTACAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAGGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCATCAATAACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATATGTTGCAGCTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTTAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTAATGTGCCTTGGAATAGTAGTTGGAGTAATAAAAATCTGAGTTATATCTGGAATAACATGACCTGGATGCAGTGGGAAAAAGAAATTGACAATTACACAGAGGAAATATACAACTTAATTGAACAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGACTTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTTATAATGATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGAGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGTTTATAGAAGTATTGCAAAGAATTTTTAGAGCTATTATCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA +MK115158.1,tat_exon2,7896,8003,7793,7900,forward,0.5826923076923078,RPSSQPRGDPTGPKESEKKVERETETDPVT,RPSSQPRGDPTGPKESEKKVERETETDPVT*RMDS*,AGACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAA +MK115158.1,rev_exon2,7897,8172,7794,8069,forward,0.45968205324650446,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGSGTSGTQGVGSPQVLVESPAVLEPGTKE,DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGSGTSGTQGVGSPQVLVESPAVLEPGTKE*,GACCCTCCTCCCAGCCGCGAGGGGACCCGACAGGCCCGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCAGTCACTTAGCGCATGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTTCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTAGCGAGGGGAGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGCCAGGAACTAAAGAATAG +MK115158.1,nef,8316,8939,8213,8833,forward,0.5254870367657829,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC,MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC*,ATGGGAGGCATATTCTCAAAACGTAATGGGGGTGGGTGGCCTGCAATAAGGGAAAGAATGAGACGAGCTCAGCCAGCAGCAGATGGGGTAGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCTCTCACAAGTAACAATACACCAGCTAACAATGCTGATTGTGCCTGGCTGGAAGCACAGGAAGAGGGGGAAGAAGTGGGTTTCCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACATACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAACAAAGACAAGATATCCTTGATCTGTGGGTCTACAACACACAGGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTGCCAATGGAACCAGAGGATGTAGAAAAGGCCACTGAAGGAGAGGACAACATCTTGTTACACCCTGTGAACCAGCATGGGATGGACGACTCAGAGAGAGAAGTGTTAGTGTGGAAGTTTGACAGCCGCCTAGCATTCCGTCACGTGGCCCGAGAGATACATCCGGAGTACTACAAGAACTGCTGA +MK114705.1,gag,532,2046,789,2291,forward,0.27270615563298484,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGCGAATTAGATAGATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAGTTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCGGTTAATCCTGGCCTGTTAGAAACATCAGAGGGCTGTAGGCAAATACTGGGACAGCTACAACCGTCCCTTCAAACAGGATCAGAAGAACTTAAATCATTATTTAATACAATAGCAGTCCTTTATTGCGTACATCAAAGGATAGATGTAAAAGACACCAAGGAAGCTCTAAATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAGCAGTCAGAGCAGTCAAGTCAGCCAAAATTACCCTATAGTGCAGAACCATCAGGGGCAAATGGTATATCAGGCTCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCCGAGGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAGGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTACATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGGACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGAAATTTATAAAAGATGGATAATCATGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTATCAGCATTCTGGACATAAGACAAGGACCAAAAGAACCTTTTAGAGATTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAAGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACCATTCTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCAGCCACAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGCAACAGGTGGTGCAACTAACATAATGATGCAGAAAGGCAATTTTAGGAACCAAGGAAAACCTATTAAGTGTTTCAATTGTGGCAAAGAAGGGCACCTAGCTAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGACTGCTCTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTCCAGAACAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAGCTCCCCCTCAGAAGCAGGAGCCGACAGACAAGGAACTGTATCCCTTCTCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAGTAA +MK114705.1,pol,1839,4850,2084,5095,forward,0.21944123990570308,FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTCCAGAACAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAGCTCCCCCTCAGAAGCAGGAGCCGACAGACAAGGAACTGTATCCCTTCTCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAGTAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAAATACCCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTAAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAACCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCCGTATTTGCCATAAAGAAAAAGGATAGTACTAAATGGAGAAAGTTAGTAGATTTCAGAGAGCTTAATAAAAGAACTCAAGACTTTTGGGAGGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTCTCAGTTCCTTTAGATGAAAGCTTCAGAAAGTATACTGCATTTACCATACCTAGTACTAACAATGAGACACCCGGGATTAGGTATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTTCAAAGTAGCATGACGAAAATCTTAGAACCTTTTAGAAAACAAAATCCAGACATAGTTATCTACCAATACATGGATGATTTATACGTAGGATCTGACTTAGAAATAGAGCAGCATAGAGCAAAAGTAGAGAACCTGAGAGAGCATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAGCATCAGAAAGAACCTCCATTTCTTTGGATGGGCTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAGCTAAGGCACTAACAGAAGTGATAACACTAACAGAAGAAGCAGAGCTAGAATTGGCAGAAAACAGAGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAGTAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACCTATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAACAAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAAGCAGTTCAAAAAATAGCCACAGAGAGCATAGTAGTATGGGGAAAGATTCCTAAATTTAGATTACCCATACAGAAAGAAACATGGGAAACATGGTGGATGGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAGTACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAAAAAGGAAAAGCAGGATATGTTACTGACAGAGGAAGGCAAAAAGTTATCCCCTTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGACAAGAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAGAAGGTCTACCTGACATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCAGGAATCAGGAAAATACTATTTTTGGATGGAATAGATAAGGCCCAGGAAGATCATGAGAAATATCATAGTAATTGGAAAGCAATGGCTAGTGATTTTAACATACCACCTGTGGTAGCAAAAGAGATAATAGCCAGCTGTGATAAATGTCAGCTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTCCATGTAGCCAGTGGGTACATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAAAATAATACATACAGATAATGGTAGCAATTTCACCAGCACTACAGTCAAGGCCGCCTGCTGGTGGGCAGGTGTTAAGCAGGAGTTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTGGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGAGTACTGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAGGGACCAGCAAAGCTGCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGAAATCAAAGTAGTACCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK114705.1,vif,4795,5373,5040,5618,forward,0.3566796368352788,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTCTAGTAAAACACCATATGTATATTTCAAAGAAAGCTAAGGGATGGGTTTACAGACACCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGGAAAAAGAGATATAACACACAAGTAGACCCTGGCCTAGCAGACCAACTAATTCATATGTACTATTTTGATTGTTTTTCAGAATCTGCTATAAGACAAGCCATATTAGGACATAGAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTGCAATACCTGGCACTAGCAGTATTAGTAGCACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTCGCGAGACTGACAGAGGATAGATGGAACAAGCCCCGGAAGATCAAGGGCCACAGAGAGAGCCATACAATGAATGGGCACTAG +MK114705.1,vpr,5313,5597,5558,5848,forward,0.39401343921808174,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS*,ATGGAACAAGCCCCGGAAGATCAAGGGCCACAGAGAGAGCCATACAATGAATGGGCACTAGAACTTTTAGAGGAGCTTAAGAGGGAAGCTGTTAGACATTTTCCTAGGGAATGGCTCCATAGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGGCAGGAGTAGGAGCCATAATAAGAATACTGCAACAATTACTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGGATAGGCATACTGAGGAGAACAAGAAATGGAGCCCGTAGATCCTAG +MK114705.1,tat_exon1,5578,5796,5829,6044,forward,0.5138258357408172,MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ,MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ*,ATGGAGCCCGTAGATCCTAGACTGGAACCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTAACAATTGCTATTGTAAAAAGTGCTGCTTTCATTGCCAAGTTTGCTTCACAAAAAAGGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGCGACAGAGACGAGGACCTCCTCGAGACAGTCAGATTCATCAAGTTCCTCTACCAAAACAGTAA +MK114705.1,rev_exon1,5717,5797,5968,6045,forward,0.5940834141610087,MAGRSGDRDEDLLETVRFIKFLYQNSK,MAGRSGDRDEDLLETVRFIKFLYQNSK,ATGGCAGGAAGAAGCGGCGACAGAGACGAGGACCTCCTCGAGACAGTCAGATTCATCAAGTTCCTCTACCAAAACAGTAAG +MK114705.1,vpu,5809,6054,6060,6308,forward,0.5727186311787074,MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL,MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL*,ATGCAACCTTTAGAGATATCAGCAATAGTAGCATTAGTAGTAGTAGCAATAATAGCAATAGTTGTGTGGACCATAGTACTCTTAGAGTATAGGAAAATATTAAGGCAAAAGAAAATAGACAGATTAATTAATAGAATAAGTGAAAGAGCAGAAGACAGTGGCAATGAGAGTGACGGGGATCAAGAAGAATTGTCAGCTCTTATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAG +MK114705.1,env,5972,8548,6223,8793,forward,0.5021538905210794,MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL,MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL*,ATGAGAGTGACGGGGATCAAGAAGAATTGTCAGCTCTTATGGAGATGGGGCGCCTTGCTCCTTGGAATGTTGATGATCTGTAGTGCTACAAACATGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGATGCAACCACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGATACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCGACCCACAAGAAGTAGTACTGGAAAATGTGACAGAAAATTATAATATGGGAAAAAATAACATGGTGGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTACTCTTAACCCCATTCTGTGTCACTTTAAATTGCACTGATGCTAACATCACCAGCACTAATAATAGTAGAGATAAGAAGGAAGGAGAAAGTACATTGGAGGAGACGAAAGGAGAAATAAAAAACTGCTCTTTCAATATGACTTCAAGCATGAGCGATAAGTCTCAGAAACAACGTGCACTTTTTTATAAGCTTGATGTGGTACAAATAGATGAGACTAATAATAATAGTTATAGGTTGATAAGTTGTAACACCTCAGTCGTCACACAGGCTTGTCCAAAGGTATCCTTTGATCCAATCCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATAATAAGAAATTCAATGGAACAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAACCTGTAGTGTCAACCCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAAGTAATGATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTGCAGCTGAAGACACCTGTACAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGGATAAGTATGGGACCAGGGAGAGTAATTTATGCAACAGGACAAATAATAGGAGATATAAGAAAAGCACATTGCAACATTAGTAGAGCAGAATGGAATACAACTTTAAAGCAGATAGTTACACAATTAAGAAAGCAGTGGAATAGAACCATAATCTTTAACTCATCCTCAGGAGGGGACCCAGAAATTGTGATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATACAACAAAACTATTTAATAGTACTTGGCCACGTAATAGTACTTGGAATAATACTGAAGGGTCAAATGACACTGAAATAATCACACTCCCGTGCAGAATAAAACAAATTGTAAACAGGTGGCAGGAAGTAGGCAAAGCAATGTATGCCCCTCCCATCCAAGGACAAATTAGTTGTTCATCAAATATTACAGGGCTGCTACTAGTTAGAGATGGTGGAATTAACACCAGTGAGAGCAACGAGACCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAGGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATGCTGGGAGCTATGTTCCTTGGGCTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGTTGACGGTACAGACCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAGCAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGACTCCTAGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAACACTAGTTGGAGTAATAGATCTTATGAAGATATTTGGAACAACATGACCTGGATGGAGTGGGAAAAAGAAATTGACAATTACACAGGCTTAATATACACCTTAATTGAAAAATCGCAGAACCAGCAGGAAATAAATGAACAAGAACTATTGTCATTGGATAAGTGGGCAAGCCTGTGGAATTGGTTTAATATAACAAATTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGACTGGATTCTTCGCACTTTTCTGGGACGATCTACGAAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTAATCTTGATTGTAGTGAGGGTTGTGGAAATTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAAATAAAGAATAGTGCTATCAGCTTGCTCAACGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGAATCATAGGAGTAGTACAAAGAACTTGGAGAGCTTTTATCCACATACCTAGGAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA +MK114705.1,tat_exon2,8130,8225,8375,8470,forward,0.6074396517609815,RPPAQPQGDPTGPKKSKKEVEKETETDQCD,RPPAQPQGDPTGPKKSKKEVEKETETDQCD**,AGACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGA +MK114705.1,rev_exon2,8131,8406,8376,8651,forward,0.47688921496698455,DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE,DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE*,GACCCCCCGCCCAGCCCCAAGGGGACCCGACAGGCCCGAAGAAATCGAAGAAGGAGGTGGAGAAAGAGACAGAGACAGATCAGTGCGATTAGTGACTGGATTCTTCGCACTTTTCTGGGACGATCTACGAAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTAATCTTGATTGTAGTGAGGGTTGTGGAAATTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAAATAAAGAATAG +MK114705.1,nef,8550,8984,8795,9415,forward,0.6017710152157637,MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK,MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK*,ATGGGTGGAAAATGGTCAAAAAAGAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAAAATGAAGCGAACTGAGCCAGCAGCAGAGGGGGTGGGAGCAGCATCTCGAGACCTGGACAAATATGGAGCAATCACAAGTAGCAATACAGCACAGACCAATCCTGATTGTGCCTGGCTAGAAGCACAAGAAGAGGAAGAGGTAGGCTTTCCAGTCAGACCCCAGGTACCTTTGAGACCAATGACTTACAAGGCAGCTGTGGATATGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAGAGACAAGATATCCTTGATCTGTGGATCTATCACACACAAGGCTACTTCCCTGATTGGCAAAATTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGAGGGTGCTTCAAGTAG +MK114856.1,gag,120,2021,789,2291,forward,0.7511039743075072,MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC,MLHISSCFLPVLGLSGWTRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSGSNLVQPERPSSSGARTGT*KRK*NQRRSLDAGLGLLKRARQEAKGGDW*VRHF*LAEARRRKIGARASVLSRGELDR*EKIQLRPRRKKKYRLKHIV*ASKELERFAVNPGLLETSGGCKQILEQLQPSLQTRSEELRSLYNTVATLYYVHQKIDVKDTKEALDKVEEEQNKSKKKAQQAAADTRNRGQTSQNFPIVQNLQGQIVHQAISPRTLNA*VKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVSRHQAAMQMLKKVINEEAAE*DRLHPVHARPIAPGQIREPKRSDIARTTSTLQEQIR*MTHNPPIPVRKIYKR*IILGLNKIVKMYSPTSILDIKQRPKEPFRDYVDQFYKTLRAKQATQKVKN*MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC*KYRKERHQMKNCTKRQANFLKKIWPSHKGRPENFPQSRPEIPQSRPEPTAPPAPPEKSFKFEEATTPSQKQETIDKELYPLTSLRSLFGNDPSSQ*,ATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTGGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGTTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGGCTCAAATCTGGTCCAACCAGAGAGACCCAGTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGTAGAACCAGAGAAGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAAAGGCGGCGACTGGTGAGTACGCCATTTTTGACTAGCAGAGGCTAGAAGGAGAAAGATAGGTGCGAGAGCGTCAGTATTGAGCAGAGGAGAATTAGATAGATAGGAGAAAATTCAGTTAAGGCCAAGGAGAAAGAAAAAATATAGATTAAAACATATAGTATAGGCAAGCAAGGAACTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGGAGGCTGTAAACAGATATTAGAACAGCTACAACCATCCCTTCAGACAAGATCAGAAGAACTTAGATCATTATATAATACAGTAGCCACCCTCTATTATGTACATCAAAAGATAGATGTAAAAGACACCAAAGAAGCGTTAGACAAAGTAGAAGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCGGCAGCTGACACAAGAAACAGAGGCCAGACCAGTCAAAATTTCCCTATAGTGCAGAACCTACAAGGGCAAATAGTACATCAGGCCATATCACCTAGAACTTTAAATGCATAAGTAAAAGTAGTAGAAGAAAAAGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACTATGCTAAACACAGTAAGTAGACACCAAGCAGCTATGCAAATGTTAAAAAAGGTCATCAATGAAGAAGCTGCAGAATAAGATAGATTACATCCAGTGCATGCAAGGCCTATTGCACCAGGCCAGATAAGAGAACCAAAAAGAAGTGACATAGCAAGAACTACTAGTACCCTTCAGGAACAAATAAGATAGATGACACATAATCCACCTATCCCAGTAAGAAAGATTTATAAAAGATAAATAATTCTAGGACTAAATAAAATAGTAAAAATGTATAGCCCTACCAGCATTTTAGACATAAAGCAAAGGCCAAAAGAACCCTTTAGAGACTATGTAGACCAGTTCTATAAAACTTTAAGAGCCAAGCAAGCTACACAGAAAGTAAAAAATTAGATGACAAAAACCTTGTTAGTCCAGAATGCAAATCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAAAAAGTAAGAAGACCCGGCCATAAAGCAAAAGTTTTAGCTGAAGCAATGAGCCAAGCAACAGGTGCAGCCAACATAATGATGCAGAGAGGCAATTTTAAGAACCAAAGAAAGCCTGTTAAATGTTTCAATTGTGGCAAAGAAAAGCACATAGCCAAAAATTGCAAGGCCCCTAAGAAAAAAGGCTGTTAGAAATATAGAAAAGAAAGACACCAAATGAAAAATTGCACTAAGAGACAGGCTAATTTTTTAAAGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGAGAACTTTCCTCAAAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAAAGAGCTTCAAGTTTGAAGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATAGACAAGGAGCTGTATCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAA +MK114856.1,pol,1787,4825,2084,5095,forward,0.7637180771917039,ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI,FFKENLAFPQRKARELSSKPTRNSSEQTRANSPTSPSRKELQV*RSNNSLSEAGDNRQGAVSSNFPQITLWQRPIVTIKIREQLKKALLNTGADDTVLEDIDLPRK*KPKMIRRIRSFIKVRQYEQVPIEISRHKAISTVLVGPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPRMDGPKVKQ*PLTEEKIKALVEICTEIEKEKKISKIRPENPYNTPVFAIKKKDGTK*KKLVDFRELNKKTQDF*EIQLSIPHPAKLKKKKSVTVLDVGDAYFSVPLDKDFKKYTAFTIPSINNETPKIRYQYNVLPQR*KRSPAIFQSSMTKILEPFRKTNPDIVIYQYIDDLYVRSDLEIRQHRTKVKELRQHLMR*RFTTPDKKHQKEPPFL*MRYELHPDKWTVQPIVLPEKES*TVNDIQKLVRKLN*ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI*RRTPKFRLPIQKET*ET*WTDYWQAT*IPK*EFVNTPPLVKL*YQLEKEPIIRAETFYVDKAANKDNKSRKARYVTDRRRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKKKVYLA*VPAHKRIKRNEQVNKLVSARIKKVLFLDKIEKAQEDHKKYHSN*RTMASNFNLPPIVAKEIVASCDKCQLKKEAMHRQVDCSPGIWQLDCTHLEEKIILVAVHVASRYIEAEVIPAETRQETAYFILKLARRWPVKTIHTDNGRNFTSNTVKAAC**AKIKQEFSIPYNPQSQEVVKSINNELKKIIRQVKDQAKHLKTAVQMAVFIHNFKRKGGIEGYSAEERIVDIIATEIQTKELQKQITKIQNFQVYYKDSRDPL*KGPAKLLWKGEKAVVIQDNSDIKVVPRRKAKIIKDYKKQMASDDCVASRQDED*,TTTTTTAAAGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGAGAACTTTCCTCAAAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAAAGAGCTTCAAGTTTGAAGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATAGACAAGGAGCTGTATCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAAAGATAAGAGAGCAACTAAAGAAAGCTTTATTAAATACAGGAGCAGATGATACAGTATTAGAAGACATAGATTTGCCAAGAAAATAGAAACCAAAAATGATAAGAAGAATTAGAAGTTTTATCAAAGTAAGACAATATGAACAGGTACCCATAGAAATTAGCAGACACAAAGCTATAAGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTAGAAGAAATCTGTTGACTCAGCTTAGTTGCACTCTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAAGAATGGACGGCCCAAAAGTTAAACAATAGCCATTAACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATAGAAAAAGAAAAGAAAATTTCAAAAATTAGGCCTGAAAATCCATACAATACTCCAGTGTTTGCCATAAAGAAAAAAGATGGCACTAAATAGAAAAAATTAGTAGATTTCAGAGAACTTAATAAGAAAACTCAAGATTTCTAAGAAATTCAATTAAGTATACCACATCCTGCAAAGCTAAAAAAGAAAAAATCAGTCACAGTACTAGATGTAGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAAGAAATATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAAAGATTAGATATCAGTATAATGTGCTTCCACAAAGATAGAAAAGATCACCAGCAATATTCCAAAGTAGCATGACAAAGATCCTAGAGCCTTTTAGAAAGACAAATCCAGACATAGTTATCTATCAATACATAGATGATTTGTATGTAAGATCTGACTTAGAAATAAGGCAACATAGAACAAAAGTAAAGGAACTGAGGCAACATCTAATGAGGTAAAGATTTACCACACCAGACAAAAAGCACCAGAAAGAACCCCCATTCCTTTAGATGAGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTACTGCCAGAAAAAGAAAGTTAGACTGTCAATGACATACAGAAGTTAGTAAGAAAATTGAATTAGGCAAGTCAGATTTATGCAAAGATTAAAGTGAAGCAATTATGTAAGCTCCTTAAAAGAACCAAAGCATTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAAAGATTCTAAAAGATCCAGTACATAGAGCATATTATGACCCAGCAAAGGACTTAATAGCAGAACTACAGAAGCAAAGAGAAGGTCAGTGGACATATCAAATTTATCAAAAGCCATTTAAAAATCTAAAAACAGAGAAATATGCAAGAACGAAAGGTGCCCATACTAATGATGTAAAGCAATTAACAGAAGCAGTGCAAAAAATATCCACAGAAAGTATAGTAATATAAAGAAGGACTCCTAAATTTAGATTACCCATACAAAAAGAAACATAAGAAACATAGTGGACAGATTATTGGCAAGCCACCTAGATCCCTAAGTAAGAGTTTGTCAACACCCCTCCCTTAGTGAAATTATAGTACCAGTTAGAAAAAGAACCCATAATAAGAGCAGAAACCTTCTATGTAGATAAGGCAGCTAATAAAGATAATAAATCAAGAAAAGCAAGATATGTTACTGACAGAAGAAGACAAAAAGTTGTCACCATAAATGACACAACAAATCAGAAAACTGAATTACAAGCCATTCATCTAGCCTTGCAAGATTCAGGGCTAGAAGTAAACATAGTAACAGACTCACAGTATGCATTAAAGATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTAATAAAAAAGAAAAAAGTCTACCTGGCATAAGTGCCAGCCCACAAAAGAATTAAAAGAAATGAACAGGTAAATAAACTAGTCAGTGCTAGAATCAAGAAAGTACTATTTTTAGATAAAATAGAAAAAGCCCAAGAAGACCATAAAAAATATCACAGTAATTAAAGAACAATGGCTAGTAATTTTAACCTACCACCTATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAAAAGAAGCTATGCATAGGCAAGTAGACTGTAGTCCAGGTATATGGCAGCTAGATTGTACACATTTAGAAGAAAAAATTATCCTAGTAGCAGTTCATGTAGCCAGTAGATATATAGAAGCAGAAGTGATTCCAGCAGAGACAAGGCAAGAAACAGCATACTTTATTTTAAAACTAGCAAGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCCGCAATTTCACCAGTAATACAGTGAAGGCCGCCTGTTAGTAGGCAAAAATCAAGCAAGAATTTAGTATTCCCTACAATCCCCAAAGTCAAGAAGTAGTAAAATCTATAAATAATGAATTAAAGAAAATTATAAGACAAGTAAAAGATCAGGCTAAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGAAGGATACAGTGCAGAGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCAGGTTTATTACAAGGACAGCAGAGATCCACTTTAGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAAAGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAAGGATTATAAAAAACAGATGGCAAGTGATGATTGTGTGGCAAGTAGACAGGATGAAGATTAG +MK114856.1,vif,4425,5348,5040,5618,forward,0.7566838361540349,MIVWQVDRMKIRTWKSLVKYHMYISKKAKK,MN*RKL*DK*KIRLNILRQQYKWQYSSTILKEKGGLKDTVQRKE**T**QQKYRLKNYKNKLQKFKIFRFITRTAEIHFRKDQQSFSGKVKRQ**YKITVT*K*CQEEKQKSLRIIKNRWQVMIVWQVDRMKIRTWKSLVKYHMYISKKAKK*AYRHHYETTHPRISSEVHIPLGGARLVITTY*GLHTGEKDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVRSLQYLALTALITPKKIKPPLPSVKKLTEDR*NKPQKTKGHRKSHTMNRH*,ATGAATTAAAGAAAATTATAAGACAAGTAAAAGATCAGGCTAAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGAAGGATACAGTGCAGAGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCAGGTTTATTACAAGGACAGCAGAGATCCACTTTAGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAAAGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAAGGATTATAAAAAACAGATGGCAAGTGATGATTGTGTGGCAAGTAGACAGGATGAAGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAGAAATAGGCTTATAGACACCATTACGAAACCACTCATCCAAGAATAAGTTCAGAAGTACATATCCCACTAGGAGGTGCTAGATTAGTAATAACAACATATTAAGGTCTGCATACAGGAGAAAAAGACTGGCATTTAGGCCAGGGAGTCTCCATAGAATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAAGTAAGATCTCTACAATACTTGGCACTAACAGCATTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAAGATAGATAGAACAAGCCCCAGAAGACCAAAGGCCACAGAAAGAGCCATACAATGAATAGACACTAG +MK114856.1,vpr,5033,5578,5558,5848,forward,0.7334692430420138,MLFIHFRIKCHHSRIGIVLQRRARNRASRS,MEKKEI*HTSRP*LSRPSNSCALF*LFFRICYKKCHIRT*S*P*V*ISSRT*QSKISTILGTNSINNTKEDKATFA*CKETDRR*IEQAPEDQRPQKEPYNE*TLELLEELKREAVRHFPRPWLQNLRQYIYETYKDTWTRVEAIIRILQQMLFIHFRIKCHHSRIGIVLQRRARNRASRS*,ATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAAGTAAGATCTCTACAATACTTGGCACTAACAGCATTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAAGATAGATAGAACAAGCCCCAGAAGACCAAAGGCCACAGAAAGAGCCATACAATGAATAGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAAACCTAAGACAATATATCTATGAAACTTATAAAGATACTTGGACAAGAGTAGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAG +MK114856.1,tat_exon1,5486,5776,5829,6044,forward,0.7619181418001311,MLFIHFRIKCHHSRIGIVLQRRARNRASRS,MLFIHFRIKCHHSRIGIVLQRRARNRASRS*TRALEASRKSA*DSLYQLLL*KVLLSLPSVFYTKSLRHLLWQEEAETETKISSRQSDSSSSSTKAV,ATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACTAGAGCCCTAGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTA +MK114856.1,rev_exon1,5698,5778,5968,6045,forward,0.524971623155505,MAGRSGDRDEDLLKTVRLIKFLYQSSK,MAGRSGDRDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAA +MK114856.1,vpu,5790,6038,6060,6308,forward,0.7407973896196594,MQPLKILAIVALVVAAIIAIVV,MQPLKILAIVALVVAAIIAIVV*TIVGIKYKKILRQRKIDRIINRIRKRAEDSGNESEKDQEELSALVVEIRHDAP*DVDDL*,ATGCAACCTTTAAAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGACCATAGTAGGCATAAAATATAAGAAAATATTAAGACAAAGAAAAATAGATAGAATAATTAATAGAATAAGAAAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAAAAGATCAGGAAGAATTGTCAGCACTTGTAGTAGAAATAAGGCACGATGCTCCTTAAGATGTTGATGATCTGTAG +MK114856.1,env,5953,8520,6223,8793,forward,0.7529994904340572,MTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD,MRAKKIRKNCQHL**K*GTMLLKMLMICSAAENL*VTVYYEVPV*RDANTTLFCASDAKAYDTEVHNV*ATHACVPTDPNPHEVELKNVTENFNM*KNNMVDQMHEDIINL*DQSLKPCAKLTPLCVTLNCTDLKNNTVGNQTNYHLNETNTIQRKEMTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD*SDTLSKIVEKLKEKFRKNKTIIFKQSSREDIEIETHSFNCREEFFYCNTTRLFNST*SVNRTSINRTNNKNITLPCRIKQIINRWQEVRKAMYAPPISKIIRCSSNITGLILTRDSSTTNSKEETFRPRERNMKDN*RSELYKYKVVKIEPLKVAPTKAQRKVVQREKRAIRTLGAMFLRFLRTAGSTIGAASLTLTVQARQLLSGIVQQQNNLLKAIEAQQHMLQLTV*GIKQLQARVLSVERYLQDQQLLKI*SCSRKLICTTTVP*NTS*SNKSYSTI*DNMT*MQ*DREIQNYTKIIYNLLKESQIQQKKNEKELLELDQ*ANL*N*FSITKWL*YIKIFIMIVGGLVSLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRRPDRPERIEEEGEKRDRGRSRRLVTRFLPLI*DDLQSLCLFSYHHLKDLLLIVLKTVQILGHKK*EILKY**SLLQY*IQELKNSAVSLLNTIAIAVAERTDKVIEVRQKISRAFLHIPRKIRQGLEKALQ*,ATGAGAGCGAAAAAGATCAGGAAGAATTGTCAGCACTTGTAGTAGAAATAAGGCACGATGCTCCTTAAGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTAAGTCACAGTCTATTATGAGGTACCTGTGTAAAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTAGAAAAATAACATGGTAGACCAGATGCATGAGGATATAATCAATTTATGAGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAAAAATAATACTGTAGGAAATCAAACAAATTATCATCTCAATGAAACTAATACAATACAAAGAAAAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAATATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAAAGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTAGTTTTGCAATTCTAAAGTGTAAAGATGAGATGTTCAATAGAACAAGACCATGTAAGAATGTCAGCACAGTACAATGTACACATAGAATTAGACCAGTAGTGTCAACTCAACTGCTGTTAAATAGTAGCCTAGCAGAAAAAAAGATAGTACTTAGATCTGAAAATTTCACAGACAATACTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAAAGAGAGCAATTTATGCAACAAGACAGATAATAGAAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGAAGTGACACTTTAAGCAAAATAGTTGAAAAATTAAAGGAAAAATTTAGAAAAAATAAAACAATAATCTTTAAGCAATCATCAAGAGAGGACATAGAAATTGAAACGCACAGTTTTAATTGTAGAGAGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGAAGTGTTAATAGAACTAGCATAAACAGAACTAACAATAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATCAACAGGTGGCAGGAAGTAAGAAAAGCAATGTATGCCCCTCCTATCAGTAAGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATAGTAGTACAACTAATAGTAAAGAAGAGACCTTCAGACCTAGAGAAAGAAATATGAAGGACAATTAGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAAAAGTAGCACCCACCAAGGCACAAAGAAAAGTAGTGCAGAGAGAAAAAAGAGCAATAAGAACGTTAGGAGCTATGTTCCTCAGGTTCTTAAGAACAGCAGGAAGCACTATAGGCGCAGCGTCACTGACGCTGACAGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAAGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTAAGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTAGAAAGATACCTACAAGATCAACAGCTCCTGAAGATTTGAAGTTGCTCTAGAAAACTCATTTGCACCACTACTGTGCCTTAGAATACTAGTTAGAGCAATAAATCTTACAGTACCATCTAAGATAACATGACCTAGATGCAGTAGGACAGAGAAATTCAAAATTACACAAAGATAATATACAACTTACTTAAAGAATCGCAAATCCAACAGAAAAAGAATGAAAAAGAATTATTAGAACTAGATCAATGAGCAAATTTGTAGAATTAGTTTAGTATAACAAAATGGCTATAGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAAGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAAAGAACAGATAAAGTTATAGAAGTAAGACAAAAAATTAGCAGAGCTTTTCTCCACATACCTAGAAAGATAAGACAAGGCTTAGAAAAGGCTTTGCAATAA +MK114856.1,nef,7916,9175,8795,9415,forward,0.7587548638132295,MSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MKKNY*N*INEQICRISLV*QNGYSI*KYS****EA**V*K*FLLYFL**IELGKDTHHYHCRPSSQPQEDQTGPKE*KKKVKRETEADPED**LDSYHSSKTTCKACAFSATTT*KTYS*LC*RLCKF*DTRSKRSSSTSRVSCSIKFRN*RIVLLACSIP*LSQ*LKEQIKL*K*DKKLAELFSTYLER*DKA*KRLCNKISGK*SKSCMAR*PAVKERIERVNPRPAAKKEQAEPAAAKVRAASRDLEKYRAITSSNTSTTNAACA*LEAQEEEEVGFPVRPQVPLRPMTYKAALNLSHFLKEKGGLEGLI*SQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRNPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGAAAAAGAATTATTAGAACTAGATCAATGAGCAAATTTGTAGAATTAGTTTAGTATAACAAAATGGCTATAGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAAGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAAAGAACAGATAAAGTTATAGAAGTAAGACAAAAAATTAGCAGAGCTTTTCTCCACATACCTAGAAAGATAAGACAAGGCTTAGAAAAGGCTTTGCAATAAAATAAGTGGCAAGTAGTCAAAAAGTTGTATGGCTAGATAGCCTGCTGTAAAAGAAAGAATAGAAAGAGTTAATCCAAGGCCTGCTGCAAAGAAAGAACAAGCTGAGCCAGCAGCAGCTAAGGTAAGAGCAGCATCTCGAGACTTAGAAAAATATAGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTAGCTAGAAGCACAAGAGGAAGAAGAAGTAGGCTTTCCAGTCAGACCTCAAGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTAAATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTAGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGAAATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATAGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA +MK114856.1,tat_exon2,8102,8197,8375,8470,forward,0.7134052388289676,RPSSQPQEDQTGPKE,RPSSQPQEDQTGPKE*KKKVKRETEADPED**,AGACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGA +MK114856.1,rev_exon2,8103,8378,8376,8651,forward,0.6888374145157732,ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE,DPPPNPKKTRQARKNRRRR*KERQRQIQKISD*ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE*,GACCCTCCTCCCAACCCCAAGAAGACCAGACAGGCCCGAAAGAATAGAAGAAGAAGGTGAAAAGAGAGACAGAGGCAGATCCAGAAGATTAGTGACTAGATTCTTACCACTCATCTAAGACGACCTGCAAAGCCTGTGCCTTTTCAGCTACCACCACTTAAAAGACTTACTCTTGATTGTGCTGAAGACTGTGCAAATTCTAGGACACAAGAAGTAAGAGATCCTCAAGTACTAGTAGAGTCTCCTGCAGTATTAAATTCAGGAACTAAAGAATAG +MK115009.1,gag,302,1714,789,2291,forward,0.7484174646972894,MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC,MGARASVLSGGKLDR*EKIYLRPEGKKKYRLKHIV*ASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQIVHQPLSPRTLNA*VKVIEEKAFSPEVIPMFSALSERATPQDLNTMLNTVRGHQAAMQMLKETINDEAAE*DRLHPVHAGPIAPGQMKEPRGSDIAGTTSTLQEQIR*MTHNPPIPVGEIYKRWIILRLNKIVRMYSPVSILDIRQRPKEPFKDYVDRFYKTLKAEQASQDVKN*MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC*KCRKERHQMKDCTKRPD*DG*FFKEDLAFPQGKAREFSPEQTRANSPASRELQV*,ATGGGTGCTAGAGCGTCAGTATTAAGCGGCGGAAAATTAGATAGATAGGAAAAAATTTACCTAAGGCCAGAAGGAAAGAAAAAATATAGATTAAAACATATAGTATAGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTAGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGCGTACATCAAAGGATAAATGTAAAAGACACCAAGGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATAGTACATCAACCATTATCACCTAGAACTTTAAATGCATAGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAAGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGAGAGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAGGCTGCAGAATAGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAAAGAACCAAGAGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAAGATAGATGACACATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTAAGGCTAAACAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAAGACCAAAAGAACCCTTTAAAGATTATGTAGACCGATTCTATAAAACTCTAAAGGCTGAGCAAGCGTCACAGGATGTAAAAAATTAGATGACAGAAACCTTGTTAGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTAAGAGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAGTCAGCCTCCATAATAGTGCAAGGAGGCAATTTTAAGAACCAAAGAAAGAATGTTAAGTGTTTCAATTGTGGCAAAGAAAGACACACAGCCAAAAATTGCAGGGCCCCTAAGAAAAAAGGCTGTTAAAAATGTAGAAAGGAAAGACACCAAATGAAAGATTGTACTAAGAGACCAGACTAAGACGGCTAATTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGA +MK115009.1,pol,1613,4624,2084,5095,forward,0.7535201229073285,AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED,FFKEDLAFPQGKAREFSPEQTRANSPASRELQV*GRGNSSSSEAGDERPRTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEINLPGK*KPKMIKRIRSFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKSGIDSPRVKQWPLTEEKIKALIEICAEIEKEKKITKIRPENPYNTPVFAIKKKDSTK*KKLVDFRELNKRTQDF*EVQLRIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPEVKYQYNVLPQR*KRSPAIFQSSMTKILEPFRKENPDIVIYQYIDDLYVRSDLEIEQHRTKIEELRQHLLR*GLTTPDKKHQKKPPFL*ISYELHPDK*TVQPIQLPDKDS*TVNDIQKLVRKLN*ASQIYPEIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQRRDQ*TYQIYQEPFKNLKTEKYARTRGAHTNDVKQLTEAVQKIALEAIVI*RKTPKFKLPIQKET*KMWWTKYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVRAETFYVNKAANRKTKLRKAEYVTDRRRQKVVSLIDTTNQRTKLHAIHLALQDSGSTVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKEKIYLA*VPAHKRIEGNEQVDKLVSNRIRRVLFLDRIDKAQEEHEKYHSN*RAMASNFNLPPVVAKEIVASCDKCQLKGEPMHRQVDCSPGIWQLDCTHLERKIILVAVHVASRYIEAEVIAAETGQETAYFILKLAGR*PVKIIHTDNGSNFTSTTVKAAC**AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED*,TTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGAGGAAGAGGCAACAGCTCCTCCTCAGAAGCAGGAGACGAAAGACCAAGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATAAATTTGCCAGGAAAATAGAAACCAAAAATGATAAAAAGAATTAGAAGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACGCCAGTCAACATAATTAGAAGAAATCTGTTGACCCAGCTTAGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGTCAGGAATAGATAGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATAGAAAAGGAAAAGAAAATTACAAAAATTAGGCCTGAGAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGAAAAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTAAGAAGTTCAACTAAGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTAGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGAAGTTAAATATCAGTACAATGTGCTTCCACAGAGATAGAAAAGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATAGATGATTTGTATGTAAGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAAGAACTGAGACAACATCTGTTAAGGTGAGGACTCACCACACCAGACAAGAAACATCAGAAAAAACCTCCATTTCTTTAGATAAGTTATGAACTCCATCCTGATAAATAGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTAGACTGTCAATGACATACAGAAGTTAGTAAGAAAGTTGAATTAGGCAAGCCAGATCTATCCAGAGATTAAAGTAAAGCAATTATGTAAACTCCTTAGAGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAGAGATTCTAAAAGAACCAGTACATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGAGGAGAGACCAATAGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGAGAAATATGCAAGAACGAGAGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGAAGAAAGACTCCTAAATTTAAACTACCTATACAAAAAGAAACATAGAAAATGTGGTGGACAAAGTATTGGCAAGCCACCTAGATTCCTGAGTAAGAATTTGTCAATACCCCTCCCTTAGTAAAACTATAGTACCAGTTAGAGAAAGAACCCATAGTAAGAGCAGAAACTTTCTATGTAAATAAGGCAGCTAATAGAAAGACTAAATTAAGAAAAGCAGAGTATGTTACGGACAGAAGAAGACAAAAGGTTGTCTCCCTAATAGACACAACAAATCAGAGGACTAAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAAAGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAAGAAAAGATTTACCTGGCATAAGTCCCAGCACACAAAAGAATTGAAGGAAATGAACAAGTAGATAAATTAGTCAGTAATAGAATCAGAAGAGTACTATTTCTAGATAGAATAGATAAAGCCCAAGAAGAACATGAAAAATATCACAGTAATTAGAGAGCAATGGCTAGTAATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATAGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAAGAAAAATTATCCTAGTAGCAGTTCATGTAGCCAGTAGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATAGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACAGTTAAAGCCGCCTGTTAGTAGGCAGAGATCAAGCAGGAATTTAGTATTCCCTACAATCCTCAAAGTCAAAGAGTAGTAAAATCTATGAATAATAAATTAAAGAAAATTATAGGACAGGTAAAAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCATAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCAGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGAGATTATAGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115009.1,vif,4289,4987,5040,5618,forward,0.7624714704923379,MAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED,MAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED*NIEQFSKTPYAYFKESSEIGLQTSL*KP*SKNKFRSTHPIRGSKIGNKNILRSAYRRKRLAFRPGSIHRMEEKEI*HTSRPWPGRPTNSPVLF*LFFRICYKECHIRT*S*S*V*ISGRT*,ATGGCAGTATTCATTCATAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCAGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGAGATTATAGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATAGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATAGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGAGGAAGCAAGATTGGTAATAAAAACATATTAAGGTCTGCATACAGGAGAAAGAGACTGGCATTTAGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAGGCAGGACATAA +MK115009.1,vpr,5087,5377,5558,5848,forward,0.6737199868435482,MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT,MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT*AEVEAIIRTLQQLLFIHFRIRCQHSRIGIIRQRRARNRASRS*,ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATAAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAG +MK115009.1,tat_exon1,5235,5573,5829,6044,forward,0.6325105553751218,MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ,MEILRQR*KP**EPCNNCCSFISELGVNIAG*ELFDRGEQEIEPVDPSLEP*KHPGSQPMTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ,ATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGCTTAGAGCCCTAGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAACAAAAAGCTTAGGCATCTCCTATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAG +MK115009.1,rev_exon1,5497,5577,5968,6045,forward,0.564475664826894,MAGRSRDSDEELLTAVRIIKRLYQSSK,MAGRSRDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG +MK115009.1,vpu,5589,5834,6060,6308,forward,0.6256860592755216,MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP,MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP*DSNDM*,ATGCATGCCTTAGAAATAGCAGCAATAGCAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAAGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGACGAGGACCAAGAGGAATTATCCGCACTTGTGGAGATGAGGCATCTTGTTCCTTAAGATAGTAATGATATGTAG +MK115009.1,env,5752,8352,6223,8793,forward,0.7518870380010406,MKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD,MRVTRTKRNYPHLWR*GILFLKIVMICSANNL*VTVYYKVPV*KEATTTLFCASDAKAYETEKHNV*ATHACVPTDPSPQEVALENVTETFNM*KNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDNLNLTCPNNNTCSNNTNYNMKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD*NDTLKQIVIKLKEKFKNKTIVFTQSSGEDPEIVMHSFNCREEFFYCNTTQLFNST*NNST*NSTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQRQIRCSSNITGLLLVRDGRSNNSSNDTETFRPRGRDMKDN*RSKLYKYKVVKIKPLRIAPTHAKRRVVQKEKRAIRLEAFFLRFLRAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQAKVLALERYLKDQQLLRI*SCSGKLICTTNVPWNISWSPRWNRSLDKI*TNMT*KQ*EKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQ*L*YIKIFIIIVRGLISLRIVFTILSIVNKVRQGYSPLSLQTLLPTQRGPDRPERTEERGRKKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLKDLLLIAARIVELLGRRK*EALKY**NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL*,ATGAGAGTGACGAGGACCAAGAGGAATTATCCGCACTTGTGGAGATGAGGCATCTTGTTCCTTAAGATAGTAATGATATGTAGTGCCAACAACTTGTAGGTCACAGTCTATTATAAAGTACCTGTATAGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTAGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTAGAAAATGTGACAGAAACATTTAACATGTAGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATAGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAACTTGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATGAAAGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAAGGTGACAAAAGAACATGCACTTTTCTATAAACTTAATGTAGTACCAATAGATGAAGATAGTAAAAATACTACGGGCAAATATAAGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTAAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATAGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATAGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTAAACGGCAGTCTAGCAGAAGAAAAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATAGAACAGACATAATAAGAGATATAAGACAAGCGCATTATAACATTAGTAAGAAAGATTAGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTAAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGAAGACCCAGAGATAGTGATGCATAGTTTTAATTGTAGAGAGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTAGAATAATAGTACTTAGAATAGTACTGATAATTAGAATAGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAAGAAGAGCAATGTATGCCCCTCCCATCCAAAGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTAGGAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTAGAGGAAGAGATATGAAGGACAATTAGAGAAGTAAATTATATAAATATAAAGTAGTCAAAATTAAACCATTAAGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAAGGAAAAAAGAGCAATAAGACTTGAAGCTTTCTTCCTTAGGTTCTTAAGAGCAGCAGGAAGCACTATAGGCGCAGCGTCAGTGACGCTGACAGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTAAGGCATCAAGCAGCTCCAGGCAAAAGTCCTGGCTTTAGAAAGATACCTAAAAGATCAACAGCTCCTAAGGATTTAAAGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATAAGATTTAGACTAACATGACCTAGAAGCAGTAAGAAAAAGAAATTGACAATTACACAGACATAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTAGGCAAGTTTGTAAAATTAGTTTGACATTACACAGTAGCTATAGTATATAAAAATATTCATAATAATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGAGGACAGATAAAATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAA +MK115009.1,nef,7748,8995,8795,9415,forward,0.7328145265888457,MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR,MNKTYWH*ISRQVCKISLTLHSSYSI*KYS****EA**V*E*FLLYCL**IKLGKDTHHCHCRPSSQPREDPTGPKEQKKEVERKTEAHPRD*CIDS*HSSRTTCGACSSSVTTA*KTYS*LRREL*NF*DAESKKH*SISRISCSIRVRK*RIVQLACSTPQQ*Q*LRGQIKL*KYYKEALELFSTYLHE*DRA*KRLCYKIGNKLSRRLKARWPAIKEKIRRARPVREPEPATAKVRAASRDLKRHGALTSSNTAATNADVACLEAQQKKEEVSFPVRPQVPLRPMTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR*CFKLVPVDPDKVEEASVRENNCLLSPENLHRMEDEHREVLQWRFDSRLAFHHIARELHPEYYKDC*,ATGAACAAGACTTATTGGCATTAGATAAGTAGGCAAGTTTGTAAAATTAGTTTGACATTACACAGTAGCTATAGTATATAAAAATATTCATAATAATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGAGGACAGATAAAATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAAGATAGGTAACAAGTTGTCAAGAAGGCTCAAGGCTAGATGGCCTGCCATAAAGGAGAAAATAAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAACAGCTAAGGTAAGAGCAGCATCTCGAGACCTGAAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTAGAAGCACAACAGAAGAAAGAAGAGGTAAGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGAGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAAGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTAGATAGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAAGTAGAAGAGGCCAGTGTAAGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATAGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACATAGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA +MK115009.1,tat_exon2,7934,8026,8375,8470,forward,0.5633802816901408,RPSSQPREDPTGPKEQKKEVERKTEAHPRD,RPSSQPREDPTGPKEQKKEVERKTEAHPRD*,AGACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAG +MK115009.1,rev_exon2,7935,8210,8376,8651,forward,0.6781884553958476,ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE,DPPPNPERTRQARKNRRKR*KERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGAGGACCCGACAGGCCCGAAAGAACAGAAGAAAGAGGTAGAAAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAAAGACTTACTCTTAATTGCGGCGAGAATTGTAGAACTTCTAGGACGCAGAAAGTAAGAAGCACTGAAGTATTAGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAG +MK115387.1,gag,292,1794,789,2291,forward,0.25442849599155104,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCTGTATTAAGCGGGGGAGAATTAGATAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAGAAAAGATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCCGGCCTTTTAGAAACAACAGAGGGATGTAAACAAATACTGGAACAGCTGCAACCATCCCTTCCGACAGGATCAGAAGAACTTAGATCATTATTTAATACAGTAGCAACCCTCTATTGTGTGCATAAGAGAATAGAGGTACAAGACACCAAGGAAGCCTTAGAAAAGATAGAAGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAGGCAGTAGCTGACACAGGAAGTACCAGCCAGGTCAGCCAAAATTACCCGATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGGCCATATCGCCTAGAACTTTAAATGCATGGGTGAAAGTAGTAGAAGAGAAGGCCTTTAGCCCAGAGGTAATACCCATGTTTTCAGCATTATCGGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAGGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTGTTGCACCAGGCCAAATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAAGAACAAATAGCATGGATGACAAGTAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAGATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAGTCCTAAGAGCCGAGCAAGCATCGCAGGATGTAAAAAATTGGATGACAGAAACCTTATTGGTCCAAAATGCAAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCAGCAGCAACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAAATATCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGACTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTCCAAGGGAAGGCCAGGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAGGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MK115387.1,pol,1587,4598,2084,5095,forward,0.17509882471546434,FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCTCCAAGGGAAGGCCAGGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAGGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGAGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGACACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCTATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGCAGAAATTTGTTGACTCAGATTGGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTACAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAAGAAGGGAAGATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGGGAACTTAATAAAAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACACCCCGCAGGGTTAAAAAAGAAGAAATCAATAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAATAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGATAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGACATAGTTATCTATCAATACATGGATGACTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACACTTGTTGAAGTGGGGATTGACCACACCAGATAAAAAACATCAGAAAGAACCCCCATTCCTGTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGACAAAGATAGCTGGACTGTCAATGACATACAGAAGCTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTGAGACAATTATGTAAACTCCTTAAGGGAGCCAAAGCGCTAACAGAAGTGATACAACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAGTTACAGAAGCAGGGGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAACGAGGGGTACCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTGATATGGGGAAAGACCCCTAGATTTAAACTACCCATACAGAAAGAAACATGGGATACCTGGTGGACAGAATATTGGCAAGCCACCTGGATTCCCGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAAAAAGAACCTATTGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAGCAGAGGAAGACAAAAGGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAACTGCAAGCAATTTGTCTAGCATTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCACTAGGAATAATTCAAGCACAACCAGATAGGAGTGAATCAGAGATAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAGGGTCTACCTTGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTCCTATTTTTGGATGGAATAGATAAGGCCCAAGAGGAGCATGAGAAATATCACAATAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGTTGTGATAAATGCCAGCTAAAGGGAGAAGCCACGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTCCTCTTAAAATTAGCAGGAAGGTGGCCAGTGAAAGCAATACATACAGACAATGGAACCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATGTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAAGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTCCAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAACAGAGATCCACTTTGGAAAGGACCAGCAAAACTTCTTTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115387.1,vif,4543,5121,5040,5618,forward,0.34158090650317496,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGCACATGGAAAAGTTTAGTAAAACACCATATGTACATTTCAAAGAAAGCCCAGGGATGGTTTTATAGACATCACTATGAAAATCCTCATCCAAGAATAAGTTCAGAAGTACACATCCCGCTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAAGGAGTCTCCATAGAATGCAGGGAAAGGAAATATAGCACACAAGTAACCCCTGACCTAGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTGCAGAATCTGCTATAAGAGAGGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAACAGCATTAGTAACACCAAAAAAGACAAAGCCACCTTTGCCTAGTGTGACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCAAACAATGAATGGACACTAG +MK115387.1,vpr,5061,5351,5558,5848,forward,0.2608047690014903,MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS,MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTGGGACAACATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115387.1,tat_exon1,5332,5550,5829,6044,forward,0.37688442211055273,MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ,MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ*,ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAAATGCTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGA +MK115387.1,rev_exon1,5471,5551,5968,6045,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKYLYQSSE,MAGRSGDSDEDLLKTVRLIKYLYQSSE,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGAG +MK115387.1,vpu,5563,5808,6060,6308,forward,0.5560235888795282,MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL,MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL*,ATGCAATCCTTATATATATTAACAATAGTAGCATTAGTAGTAGCAGCAATATTAGCAATAGTTGTGTGGGCCATAGTACTCATAGAATATAAGAAAATATTAAAACAAAGGAGAATAGATAGGTTAATTGATAGAATAATAGATAGGGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAG +MK115387.1,env,5726,8287,6223,8793,forward,0.5276672448389619,MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL,MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL*,ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCATGCTCCTTGGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTAATAGGAAATGTAACAGAAGATTTTAACATGTGGAAGAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGTCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGTACTGATATTAGGAATAGTACCGTTACTTCTAATACTACTACTTGGGGAGAAATGACAAACTGCACTTTCAATATCACCACAAGCATAAAGGATAAGATGAAAAAAGAAGCGGCACTTTTTTATAAAATTGATTTAGTAGAAATAGATGAAGAGAAAAATAACAGTAGTACCAGATATAGGTTGATAAATTGTAACACCTCAGCCATTACACAAGCCTGCCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCAATTCTAAAGTGTAATAATAAGAAGTTCAGTGGAAAGGGACCATGTACAAATGTCAGCACAGTGCAATGTACACATGGAATTAAGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAATGATTAGATCTGACAATATCACAGACAATACTAAAAACATAATAGTACAGTTGAAGGAAGCCATACAAATTTTCTGTATAAGACCCAACAACAATACAAGAAAAAGTATAAATATAGGACCAGGGAGAGCATTTTACACAACAGGAGATATAATAGGAGACATAAGGCAAGCACATTGTAACATTAGTGGAAATTGGAATAACACTTTAAAACAGATAGCTACACAATTAGGAAAACAACTGAATCAAACACAACAAATAATCTTTAATTCATCCGCAGGAGGGGACCCAGAGATTGTAACACACAGTTTTAATTGTGGAGGGGAATTCTTCTATTGTAATTCATCATCACTGTTTAATAGTACCTGGACTAAAAATGGTACTGGTAGTTGGCAGTCTAATGATACTCAGAATGGTAATATCACACTCCAATGCAGAATAAAACAAATTATAAACCTGTGGCAGGGAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGTGGACAAATTAACTGTACATCAAATATTACAGGGCTGGTTTTAACAAGAGATGGGGGGAAGGTGATTAATGAAACTGAGACCTTTAGACCTGGAGGAGGAAATATGAAGGATAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAAAGAGAGAAAAGAGCAGTAGGACTGGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCCGGAAGCACTATGGGCGCAGCGTCAATAGCGCTGACGGAACAGGCCAGACGAGTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATTTGTTGCAACTCACAGTCTGGGGCATTAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTAGGACTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATCGTAGTTGGGGTGGGCATAACAAAAATCTAGATGACATTTGGGGTAACATGACCTGGATGGAGTGGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTACAGAATCACATTCCCAACAAGAAAAGAATGAACAAGAATTATTGGCATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAGGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTGGGACGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAGGGACAGATAGGATAATAGAAATATTACAAAGAATTGGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +MK115387.1,tat_exon2,7869,7964,8375,8470,forward,0.6995153473344102,RPSSQLRGEPTGPKE,RPSSQLRGEPTGPKE*KKEVERETKADPVD**,AGACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGA +MK115387.1,rev_exon2,7870,8145,8376,8651,forward,0.32366339007432277,DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE,DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE*,GACCCTCCTCCCAGCTCCGAGGGGAGCCGACAGGCCCGAAGGAATAGAAGAAGGAGGTGGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTGGGACGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAATAG +MK115387.1,nef,8289,8939,8795,9415,forward,0.4631394979345408,MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC,MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTAGGGTTGGATGGAATGCAGTGAGGGAAAGAATGAGACGAGCTCAGCCAACAGCAGATAGGGAACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTAGAGACCTGGAAAAATATGGAGCACTTACAAGTAGGAATACAGCAGCTACTAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGATGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGACCCATGACTTATAAAGCAGCTCTAGATCTGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAGTTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTATTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCACTTGAGCCAGATCAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCCTGTTACACCCTCTGAGCCAGCATGGGATGGATGACCCGGAGAAAGAAGTGCTAGTGTGGAGGTTTGACAGCCGCCTCGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAAGACTGCTGA +MK115491.1,gag,521,2020,789,2291,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115491.1,pol,1813,4824,2084,5095,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115491.1,vif,4769,5347,5040,5618,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115491.1,vpr,5287,5577,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115491.1,tat_exon1,5558,5776,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115491.1,rev_exon1,5697,5774,5968,6045,forward,0.4267425320056898,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115491.1,vpu,5789,6034,6060,6308,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115491.1,env,5952,8492,6223,8793,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115491.1,tat_exon2,8074,8169,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115491.1,rev_exon2,8075,8350,8376,8651,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115491.1,nef,8494,9108,8795,9415,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK116110.1,gag,62,1600,140,1642,forward,0.7362754920106639,MSQVNSTTVMMQKGNFRNQKKTVKCFNCGKIGHIAKNCRAPRRKGCWKCGQEGHQMKDCSERQANFLGKLWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPIDRELYSLASLKSLFGNDPSSQ,MAGSPHSLTCCHHFF*CSCWSQCF*NSLTIWVCILDQQGFCHPIFYIL*SLLGS*GFIEPVYIVSKGFLWSLFYVQNADRTIHSYYFI*SQDYPSFIDISYWDRWIICHPSYLFLKGTSSSCYITSPWFSHLAWCNRPCMHWMQSIPFCSFLIDGLF*YLHCCLMSPHCI*HGVYILWGGSFC*C*KHRYYFWAKSLFFYYFYPCI*SSR*HGLMYHLPLEVLHYRVVLADLAVISCASCCLLCFHLAFVLLFLYLI*RSLGVLYLYPLMYTIEDRYCII**FKLF*PCLEGWL*LSQYLSTAF*CF*QARINCESF*LPACPY*MF*PIFFLSSWP*PNFFPLV*FSPA*Y*RSRTHLSPSSLR*VKTFLAYSPVAEAMSQVNSTTVMMQKGNFRNQKKTVKCFNCGKIGHIAKNCRAPRRKGCWKCGQEGHQMKDCSERQANFLGKLWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPIDRELYSLASLKSLFGNDPSSQ*,ATGGCCGGGTCCCCCCACTCCCTGACATGCTGTCATCATTTCTTCTAGTGTAGCTGCTGGTCCCAATGCTTTTAAAATAGTCTTACAATCTGGGTTTGCATTTTGGACCAACAAGGTTTCTGTCATCCAATTTTTTACATCCTGTGAAGCTTGCTCGGCTCTTAGGGTTTTATAGAACCGGTCTACATAGTCTCTAAAGGGTTCCTTTGGTCCTTGTTTTATGTCCAAAATGCTGACAGGACTATACATTCTTACTATTTTATTTAATCCCAGGATTACCCATCTTTTATAGATATCTCCTACTGGGATAGGTGGATTATTTGTCATCCATCCTATTTGTTCCTGAAGGGTACTAGTAGTTCCTGCTATATCACTTCCCCTTGGTTCTCTCATTTGGCCTGGTGCAACAGGCCCTGCATGCACTGGATGCAATCTATCCCATTCTGCAGCTTCCTCATTGATGGTCTCTTTTAATATTTGCATTGCTGCTTGATGTCCCCCCACTGTATTTAGCATGGTGTTTATATCTTGTGGGGTGGCTCCTTCTGCTAATGCTGAAAACATAGGTATTACTTCTGGGCTAAAAGCCTTTTCTTCTACTACTTTTACCCATGCATTTAAAGTTCTAGGTGACATGGCCTGATGTACCATTTGCCCCTGGAGGTTTTGCACTATAGGGTAGTTTTGGCTGACCTGGCTGTTATTTCCTGCGCCAGCTGCTGCTTGCTGTGCTTTCATCTTGCTTTTGTTTTGCTCTTCCTCTATCTTATCTAGCGCTCCCTTGGTGTCTTGTATCTCTATCCTTTGATGTATACAATAGAGGACCGCTACTGTATTATATAATGATTTAAGCTCTTCTGACCCTGTTTGGAGGGATGGCTGTAGCTGTCCCAGTATTTGTCTACAGCCTTCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGCTCCCTGCTTGCCCATACTAGATGTTTTAACCTATATTTTTTCTTTCCTCCTGGCCTTAACCGAATTTTTTCCCATTGGTCTAATTTTCCCCCGCTTAATACTGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGGTAAAAACTTTTTTGGCGTACTCACCAGTCGCCGAAGCAATGAGCCAAGTAAATTCAACTACCGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAAGAAGACTGTTAAGTGTTTCAACTGTGGTAAAATAGGGCATATAGCAAAAAATTGCAGGGCCCCCAGGAGAAAGGGCTGTTGGAAATGTGGACAGGAAGGACACCAGATGAAAGATTGTAGTGAGAGACAGGCTAATTTTTTAGGGAAACTCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAAGAGACAGCAACTCCCCCTCAGAAGCAGGAGCCGATAGACAGGGAACTATATTCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCTCAATAA +MK116110.1,pol,1393,4404,1435,4446,forward,0.2475474244944199,FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED,FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED*,TTTTTTAGGGAAACTCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCTTCAGGTTTGGGGAAGAGACAGCAACTCCCCCTCAGAAGCAGGAGCCGATAGACAGGGAACTATATTCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCTCAATAAAAGTAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGTGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAATATGATCAGATACCCATAGAAATCTATGGACATAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATTTGTTGACTCAGATTGGGTGCACTTTAAATTTTCCCATTAGTCCTATCGAAACTGTACCAGTAAGATTAAAGCCAGGAATGGATGGCCCAAAAATTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAGATTTCAAAGATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGGGAACTTAATAAGAGAACTCAAGATTTCTGGGAAGTTCAATTGGGAATACCGCATCCCGCAGGATTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCATTAGATAAAGACTTTAGGAAGTATACTGCATTTACCATACCCAGTGTAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAGCTAGCATGACAAAAATTTTAGAGCCTTTTAGGAAGCAAAATCCAGACATGGTTATTTATCAATACATGGATGATCTATATATAGGATCTGACTTGGAATTAGGACAGCATAGGACAAAAATAGAGGAACTGAGACAACATCTATTGAGGTGGGGGTTTACCACACCAGACAAGAAGCATCAGAAAGAACCTCCATTCCTCTGGATGGGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAACACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTAGGAAAATTAAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTAAGGCAGTTATGTAAACTCCTTAGAGGAACCAAATCACTAACAGAAGTAGTACCACTAACAAGAGAGGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCGGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAATTACAAAAGCAGGGACAAGGCCAGTGGACTTATCAGATTTATCAAGAACCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAATAAAGGGTACCCACACTAATGATGTAAAACAATTAACACAGGCTGTGCAAAAAATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATCCCTGAGTGGGAGTTTGTTAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGACCCCATAGTAGGAGCAGAAACATTCTATGTCGATGGGGCAGCCAATAGGGATACTAAATTAGGAAAAGCAGGATATGTTACTGACAGGGGAAGACAAAAAATTGTCCCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTTACCTAGCTCTGCAGGATTCAGGATCAGAAGTAAACATAGTATCAGACTCACAGTATGCAATAGGAATTCTTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGACATGGGTGCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTATTATTCTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCCATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGTTAAAAGGAGAAGCCATACATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTGGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTGGCCAGTGGATATATTGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATATTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAACACAATACATACAGACAATGGCAGCAACTTCACTAGCACTGCGGTTAAAGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGGGATCAAGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGAGGTACAGTGCAGGGGAAAGAATAGTAGACATGATAGCATCAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAACAGTGAAATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGACTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAGGTAGACAGGATGAGGATTAA +MK116110.1,vif,4349,4927,4391,4969,forward,0.4686663095875737,MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH,MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAGGTAGACAGGATGAGGATTAATGCATGGAAAAGCTTAGTAAAGCACCATATGCATGTTTCAAGGAAAGTTGAGAGATGGGTTTATAAACATCACTATGAAAGTACTAATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTAAAAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGAAAAAAGAGCTATAATACACAAGTAGACCCTGAAGTAGCAGACCAACTAATCCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAAAGCCATAGTAGGACATAGAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCCCTACAGTACTTGGCATTAGCAGCATTAGTAAAATCAAAAAAGACAAAGCCACCTTTGCCTAGCGTTACGAAGCTGACGGAGGATAGATGGAACAAGCCCCAGAGGACCAAGGGCCGCAGAGGGAACCATATAATGAATGGGCACTAG +MK116110.1,vpr,4867,5157,4909,5199,forward,0.4534005037783373,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPRIWLQSLGQYVYETYGDTWTGVEAIIRILQQMLFIHFRIGCQHSRIGIIRRGRTRNGASRP,MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPRIWLQSLGQYVYETYGDTWTGVEAIIRILQQMLFIHFRIGCQHSRIGIIRRGRTRNGASRP*,ATGGAACAAGCCCCAGAGGACCAAGGGCCGCAGAGGGAACCATATAATGAATGGGCACTAGAGCTTTTAGAGGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGGATATGGCTTCAGAGCTTAGGACAATACGTCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTTTGCAACAAATGCTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATTCGACGAGGGAGAACAAGAAATGGAGCCAGTAGACCCTAG +MK116110.1,tat_exon1,5138,5356,5180,5398,forward,0.48719691819623834,MEPVDPSLAPWKHPGSQPKTACTNCYCKKCCLHCQVCFTKKGLGISYGRKKRRQRRRPPQSSKAHQNPLPKQ,MEPVDPSLAPWKHPGSQPKTACTNCYCKKCCLHCQVCFTKKGLGISYGRKKRRQRRRPPQSSKAHQNPLPKQ*,ATGGAGCCAGTAGACCCTAGCCTAGCGCCCTGGAAGCACCCAGGAAGTCAGCCTAAGACTGCTTGTACCAATTGCTATTGTAAAAAGTGCTGCTTACATTGCCAAGTTTGTTTCACAAAAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAGCAGTAAGGCTCATCAAAATCCTCTACCAAAGCAGTAA +MK116110.1,rev_exon1,5277,5354,5319,5396,forward,0.4267425320056898,MAGRSGDSDEDLLKAVRLIKILYQSS,MAGRSGDSDEDLLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAGCAGTAAGGCTCATCAAAATCCTCTACCAAAGCAGT +MK116110.1,vpu,5369,5614,5411,5656,forward,0.46373488953730724,MQSLQIGAIVALVVGTIIAIVVWSIVLIEYRKILRQKKIDRIIDRIVERAEDSGNESEGDQEELSALVERGHDAPWNVNDL,MQSLQIGAIVALVVGTIIAIVVWSIVLIEYRKILRQKKIDRIIDRIVERAEDSGNESEGDQEELSALVERGHDAPWNVNDL*,ATGCAATCTTTGCAAATAGGAGCAATAGTAGCATTAGTAGTAGGAACAATAATAGCAATAGTTGTGTGGTCTATAGTACTCATAGAATATAGGAAAATATTAAGACAAAAGAAAATAGATAGAATAATAGATAGAATAGTAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGACCAGGAAGAGTTATCAGCACTGGTGGAAAGGGGGCATGATGCTCCTTGGAATGTTAATGATCTGTAG +MK116110.1,env,5532,8072,5574,8123,forward,0.47450452559300893,MRVKETRKSYQHWWKGGMMLLGMLMICSAATNLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVLLGNVTEDFNAWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILHCTDVNNTRNGMTGELKNCSFNITTKITNKVQKEYALFYKLDVVPINNKDNDTSFNNNSYRLISCNTSVITQACPKVSFEPIPIHYCTPAGYAILRCNNETFSGKGPCTNVSSIQCTHGIRPVVSTQLLLNGSLAKQEVVIRSQNFSDNVKTIIVQLKTPVKINCTRPNNNTRKSIHAGPGKVIYATGEIIGDIRQAHCNISAAEWNDTLGQIVTKLQEQFGNKTIVFNQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWNNNGTNTWNSTGNITLPCKIRQIVNMWQKVGKAMYAPPIRGQIKCSSNITGLLLTRDGGNESESETFRPGGGDMRDNWRSELYKYKVVRIEPLGLAPTKAKRRVVQREKRAIGTLGAVFLGFLGTAGSTMGAASMTLTVQARQLLSGIVQQQNNLLKAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNASWSNKSLNEIWDNMTWMEWEKEISNYTQLIYTLIEESQSQQEKNEQELLALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEDGGERDRDRSTRLVTGFLPLFWDDLRSLCLFSYHRLRDLLLIAARIVELLGHRGWEILKHWWSLLQYWSQELKKSAVSLLNATAIAVAEGTDRIIEVVQRACRAILHIPVRLRQGLERALL,MRVKETRKSYQHWWKGGMMLLGMLMICSAATNLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVLLGNVTEDFNAWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILHCTDVNNTRNGMTGELKNCSFNITTKITNKVQKEYALFYKLDVVPINNKDNDTSFNNNSYRLISCNTSVITQACPKVSFEPIPIHYCTPAGYAILRCNNETFSGKGPCTNVSSIQCTHGIRPVVSTQLLLNGSLAKQEVVIRSQNFSDNVKTIIVQLKTPVKINCTRPNNNTRKSIHAGPGKVIYATGEIIGDIRQAHCNISAAEWNDTLGQIVTKLQEQFGNKTIVFNQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWNNNGTNTWNSTGNITLPCKIRQIVNMWQKVGKAMYAPPIRGQIKCSSNITGLLLTRDGGNESESETFRPGGGDMRDNWRSELYKYKVVRIEPLGLAPTKAKRRVVQREKRAIGTLGAVFLGFLGTAGSTMGAASMTLTVQARQLLSGIVQQQNNLLKAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNASWSNKSLNEIWDNMTWMEWEKEISNYTQLIYTLIEESQSQQEKNEQELLALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEDGGERDRDRSTRLVTGFLPLFWDDLRSLCLFSYHRLRDLLLIAARIVELLGHRGWEILKHWWSLLQYWSQELKKSAVSLLNATAIAVAEGTDRIIEVVQRACRAILHIPVRLRQGLERALL*,ATGAGAGTGAAGGAGACCAGGAAGAGTTATCAGCACTGGTGGAAAGGGGGCATGATGCTCCTTGGAATGTTAATGATCTGTAGTGCTGCAACAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACGCATGCCTGTGTACCCACGGACCCCAACCCACAAGAAGTATTATTGGGAAATGTGACAGAAGATTTTAATGCATGGAAAAATAACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAATTAACCCCACTTTGTGTTATTTTGCATTGCACTGATGTCAACAATACTAGAAATGGGATGACAGGAGAACTAAAAAACTGCTCTTTCAATATCACCACAAAAATAACAAATAAGGTACAGAAAGAATATGCACTCTTTTATAAACTTGATGTAGTACCAATAAATAATAAGGATAATGATACTAGCTTTAATAATAATAGCTATAGGTTGATAAGTTGTAACACCTCAGTTATTACACAGGCTTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTACTGTACCCCGGCTGGTTATGCAATTCTAAGGTGTAACAATGAGACATTCAGTGGAAAAGGGCCATGTACAAATGTCAGCTCAATACAATGTACACATGGAATTAGGCCAGTAGTGTCAACTCAACTGCTGTTAAATGGCAGTCTAGCAAAACAGGAGGTAGTAATTAGATCTCAAAATTTCTCGGACAATGTTAAAACCATAATAGTACAGCTGAAGACCCCTGTAAAAATTAACTGTACAAGGCCCAATAACAATACAAGAAAAAGTATACATGCAGGACCAGGGAAAGTAATTTATGCAACAGGAGAAATAATAGGAGATATAAGACAAGCACATTGCAACATTAGTGCAGCAGAGTGGAATGATACTTTAGGACAGATAGTTACAAAATTACAAGAACAATTTGGGAATAAAACAATAGTCTTCAATCAATCGTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTTTACTGTAATTCAACACAACTGTTTAATAGTACTTGGAATAATAATGGTACTAATACTTGGAATAGTACAGGTAATATCACACTCCCATGTAAAATAAGGCAAATTGTAAACATGTGGCAGAAAGTAGGAAAAGCAATGTATGCTCCTCCCATCCGTGGACAAATTAAATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAACGAGAGTGAGAGCGAAACCTTCAGACCTGGCGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGACTAGCACCCACTAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAACACTGGGAGCTGTGTTCCTTGGGTTCTTGGGAACAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGGCAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATCTGCTGAAGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATTAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGCAATAAATCTCTGAATGAAATTTGGGATAACATGACCTGGATGGAGTGGGAAAAAGAAATTAGTAATTACACACAATTAATATACACTTTAATTGAAGAATCGCAGAGCCAGCAAGAAAAGAATGAACAAGAATTATTGGCACTAGATAAGTGGGACAGCTTGTGGAGTTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAATAGGGTTAAGAATAGTTTTTACTGTACTTTCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTGTCATTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGACGGTGGAGAGAGAGACAGAGACAGATCCACACGCTTAGTAACCGGATTCTTACCACTTTTCTGGGACGACCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTACAATATTGGAGTCAGGAACTAAAAAAAAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTAGTACAAAGAGCTTGTAGAGCTATTCTCCACATACCTGTAAGACTAAGACAAGGCTTAGAAAGAGCTTTGCTATAA +MK116110.1,tat_exon2,7654,7749,7705,7797,forward,0.4464285714285715,RPASQPRGDPTGPKESKKTVERETETDPHA,RPASQPRGDPTGPKESKKTVERETETDPHA**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGACGGTGGAGAGAGAGACAGAGACAGATCCACACGCTTAGTAA +MK116110.1,rev_exon2,7655,7939,7706,7981,forward,0.46126825660935467,DPLPSPEGTRQARRNRRRRWRERQRQIHTLSNRILTTFLGRPEEPVPLQLPPLERLTLDCSEDCGTSGTQGVGNPQTLVESPTILESGTKKKCC,DPLPSPEGTRQARRNRRRRWRERQRQIHTLSNRILTTFLGRPEEPVPLQLPPLERLTLDCSEDCGTSGTQGVGNPQTLVESPTILESGTKKKCC*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGACGGTGGAGAGAGAGACAGAGACAGATCCACACGCTTAGTAACCGGATTCTTACCACTTTTCTGGGACGACCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTACAATATTGGAGTCAGGAACTAAAAAAAAGTGCTGTTAG +MK116110.1,nef,8074,8694,8125,8751,forward,0.437094682230869,MGGKWSKSSVVGWPAVRERIRRAGPAAEGVGAVSRDLDKHGAITSNNTPATNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGMIYSQQRQDILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPLETEQVEAATGGENNCLLHPLNQHGMDDPEREVLMWKFDSSLAFHHRAKELHPEYYKDC,MGGKWSKSSVVGWPAVRERIRRAGPAAEGVGAVSRDLDKHGAITSNNTPATNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGMIYSQQRQDILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPLETEQVEAATGGENNCLLHPLNQHGMDDPEREVLMWKFDSSLAFHHRAKELHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGGTTGGATGGCCTGCTGTAAGGGAAAGAATAAGAAGAGCTGGGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGACAAACATGGAGCAATCACAAGTAACAATACACCAGCTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTTAGGCCTCAAGTACCTTTAAGACCAATGACTTACAAGGGAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGATGATATACTCCCAGCAAAGACAAGATATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGACCAGGGGTCAGGTTTCCACTGACCTTTGGATGGTGCTTCAAACTAGTACCACTTGAGACAGAGCAGGTAGAAGCGGCCACTGGAGGAGAGAACAACTGCTTGTTACACCCTTTGAACCAGCATGGGATGGATGACCCGGAGAGAGAAGTACTAATGTGGAAGTTTGACAGCAGCCTAGCATTTCATCACAGAGCCAAAGAGCTGCATCCGGAGTACTACAAAGACTGCTGA +MK115527.1,gag,683,2182,789,2291,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115527.1,pol,1975,4986,2084,5095,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115527.1,vif,4931,5509,5040,5618,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115527.1,vpr,5449,5739,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115527.1,tat_exon1,5720,5938,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115527.1,rev_exon1,5859,5936,5968,6045,forward,0.4267425320056898,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115527.1,vpu,5951,6196,6060,6308,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115527.1,env,6114,8654,6223,8793,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115527.1,tat_exon2,8236,8331,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115527.1,rev_exon2,8237,8512,8376,8651,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115527.1,nef,8656,9270,8795,9415,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK114997.1,gag,210,1718,789,2291,forward,0.27936962750716343,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP*YQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATGGGAAAAAATTTACCTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGCGTACATCAAAGGATAAATGTAAAAGACACCAAGGAAGCTCTAGACACAATAGAGGAAGAACAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATGGTACATCAACCCATATCACCTAGCACTTTAAATGCATGGGTAAAAGTGATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAGGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAGGGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATACTCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGGGATTATGTAGATCGGTTCTATAAAACTCTAAGGGCTGAGCAAGCGTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCCTCCATAATGGCGCAAGGAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA +MK114997.1,pol,1511,4522,2084,5095,forward,0.26443159013103534,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAGAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCAGTCAACATAATTGGAAGAAATCTGTTGACCCAGCTTGGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGACAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATGGAAAAGGAAGGGAAAATTACAAAAATTGGGCCTGAGAATCCATATAATACTCCAGTGTTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTGGGAAGTTCAACTAGGAATACCACATCCCGCAGGGTTAAAAAGGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTTTCAGTTCCTTTAGACCAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGGAGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGGGGTGGGGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAGTTGAATTGGGCAAGCCAGATCTATCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTCCATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGGGGAGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCTATACAAAAGGAAACATGGGAAATGTGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAATAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAATTAGGAAAAGCAGGGTATGTTACGGACAGAGGAAGACAAAAGGTTGTCTCCCTAATGGACACAACAAATCAGAGGACTGAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTAACAGACTCACAATATGCCTTAGGGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAGGAAAAGATTTACCTGGCATGGGTCCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTAATGGAATCAGAAAAATACTATTTCTGGATGGAATAGATAAGGCCCAAGAAGAACATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATACATAGAAGCAGAAGTTATTGCCGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK114997.1,vif,4467,5045,5040,5618,forward,0.3903081914030819,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGGGGAAGCAAGATTGGTAATAAAAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTAGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCCTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAG +MK114997.1,env,4985,8206,6223,8793,forward,0.6657028690558922,MHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*LRALETSRKSTYDCL*QLLL*TVLLSLPSLLHHKRLRHLLWQEEAETATKSFSQQSESSSGSTRAVSITCNACLKNSSNSRISSSNNNSNSCVVYSINRI*ENFKTKENRQVN**NKRKSRRQWQ*K*RRPGGIISTCGDGASCSLGW**YVVPTTCGSQSIMGYLYGKKQLPLYFVHQMLKHMRQRSIMFGQPMPVYPQTPAHRK*H*KM*QKHLTCGKMTW*SRCMRI*SVYGIKA*SHV*N*PHSVLL*IALIV*VIILIII*RKKEK*KTALSMSPQE*EIG*QKNMHFSIDLM*YQ*MKIVEILRANIG**IVTPQSLHKPVQRYPLSQFPYIFVPRLVLRF*SVEIRNSMEQENVEMSAQYNVHMELGQ*YQLNCC*TAV*QKKR**LDLPISRTMLKP**YS*INL*KLIVQDPTIIQEEVYT*DQGEHFMEQT**GI*DKRIVTLVGKIGMTL*KKIVIKLKEKFENKTIVFNQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAGTATTACATGTAATGCATGCCTTAAAAATAGCAGCAATAGTAGGATTAGTAGTAGCAACAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGAGACCAGGAGGAATTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAACAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGAAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAGTTTAAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAGACTTGATGTAGTATCAATAGATGAAGATAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGATATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAGAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAACCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGAGCATTTTATGGAACAGACATAATAGGGGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAAAAAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATGGTACTGATAATTGGAATGGTACTGAATCAAATAACACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCTCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGGAGCAACAATAGTAGTAATGATACAGAGACATTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAGTGGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAGGCAGTGGGAAAAGGAAATTGACAATTACACAGACACAATATATAACTTAATTGAACTATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAGTTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTACTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +MK114997.1,vpr,4985,5275,5558,5848,forward,0.3120665742024965,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAGCTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK114997.1,tat_exon1,5256,5471,5829,6044,forward,0.4691531785127845,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAG +MK114997.1,rev_exon1,5395,5475,5968,6045,forward,0.5290287574606619,MAGRSGDSDEELLTAVRIIKRLYQSSK,MAGRSGDSDEELLTAVRIIKRLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG +MK114997.1,vpu,5487,5732,6060,6308,forward,0.5568484042553192,MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM,MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM*,ATGCATGCCTTAAAAATAGCAGCAATAGTAGGATTAGTAGTAGCAACAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGAGACCAGGAGGAATTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG +MK114997.1,tat_exon2,7788,7880,8375,8470,forward,0.4918032786885247,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG +MK114997.1,rev_exon2,7789,8064,8376,8651,forward,0.40871934604904625,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG +MK114997.1,nef,8208,8849,8795,9415,forward,0.5432971135257649,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC,MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTGCCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTTCAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTTCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGTCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAATATTTCAAGGACTGCTGA +MK115518.1,gag,739,2238,789,2291,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115518.1,pol,2031,5042,2084,5095,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115518.1,vif,4987,5565,5040,5618,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115518.1,vpr,5505,5795,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115518.1,tat_exon1,5776,5994,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115518.1,rev_exon1,5915,5995,5968,6045,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115518.1,vpu,6007,6252,6060,6308,forward,0.5399181166837258,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115518.1,env,6170,8710,6223,8793,forward,0.4583799776107468,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115518.1,tat_exon2,8292,8387,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115518.1,rev_exon2,8293,8568,8376,8651,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115518.1,nef,8712,9326,8795,9415,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115065.1,gag,221,1729,789,2291,forward,0.2880084183556756,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP,MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATGGGAAAAAATTTACCTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAGAGTCATCAGAAGGCTGCAGGCAAATTCTGGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGCGTACATCCAAGGATAAATGTAAAAGACACCAAAGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAGGGGCAAATGGTACATCAACCCTTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGCTGAGGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAGGGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGATATCTATAAAAGATGGATAATCCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGGGATTATGTAGACCGGTTCTATAAAACTCTAAGGGCTGAGCAAGCGTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAATCAGCCTCCATAATGGTGCAGGGAGGCAATTTTAGGAACCAAAGAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACACAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA +MK115065.1,pol,1522,4533,2084,5095,forward,0.25117173416656646,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED,FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTGGGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAGGAGGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATTTGTGGACATAAAGCTATAGGTACAGTATTAATAGGACCTACACCAGTCAACATAATTGGAAGAAATCTGTTGACCCAGCTTGGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATGGAAAAGGAAGGGAAAATTACAAAAATTGGGCCTGAGAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCCGAGAACTTAATAAGAGAACACAAGACTTCTGGGAAGTTCAACTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAGGAGTTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGGAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGATTTAGAAATAGAGCAGCACAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGGGGTGGGGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTGGACTATCAATGACATACAGAAGTTAGTGGGAAAGTTGAATTGGGCAAGCCAAATCTATCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGGGGAGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCTATACAAAAGGAAACATGGGAAATGTGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAGACTAAATTAGGAAAAGCAGGGTATGTTACGGACAGAGGAAGACAAAAGGTTGTCTCCCTAATGGACACAACAAATCAGAGGACTGAGTTACACGCTATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAGGGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAGGAAAAGATTTACCTGGCATGGGTCCCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTAGTGGAATCAGAAAAGTACTATTTCTGGATGGAATAGATAAGGCCCAAGAAGAACATGAAAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAGGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115065.1,vif,4478,5056,5040,5618,forward,0.3903081914030819,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGGGTTTACAGACATCACTATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAGGGGAAGCAAGATTGGTAATAAAAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGCCAGGGAGTATCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAG +MK115065.1,vpr,4996,5286,5558,5848,forward,0.3351206434316354,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGTCCCAGAGGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAACTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTGGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115065.1,tat_exon1,5267,5485,5829,6044,forward,0.48954161103693805,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ,MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA +MK115065.1,rev_exon1,5406,5483,5968,6045,forward,0.4886988393402566,MAGRSGDSDEELLTAVRIIKRLYQSS,MAGRSGDSDEELLTAVRIIKRLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT +MK115065.1,vpu,5498,5743,6060,6308,forward,0.5568484042553192,MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM,MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM*,ATGCATGCCTTAGAAATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGTCTATAGTATTAATAGAATATAGGAAAATTTTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGGGGACCAGGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAG +MK115065.1,env,5661,8261,6223,8793,forward,0.5052314240113498,MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL,MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL*,ATGAAAGTGACGGGGACCAGGAGGAGTTATCAGCACTTGTGGAGATGGGGCATCTTGTTCCTTGGGATGGTGATGATATGTAGTGCCAACAACTTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTGGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATAATTTAAATCTAAATCGCCCTAACAATAATACTTGTAGTAATAATACTAATTATAATATAACGGAAAAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAGGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAGGTAGTGGAAATACTACGGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATGGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAGGGAGGGCATTTTATGGAACAGACATAATAGGAGATATAAGACAAGCGCATTGTAACATTAGTGGGAAAGATTGGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTGAGAATAAAACAATAGTCTTTACTCAATCCTCAGGAGGGGACCCAGAGATAGTGATGCATAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAATAGTACTTGGAATGGTACTGACAATTGGAATGGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAGGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATGGTGGGAGCAACAATAGTAGTAATGATACAGAGACCTTCAGGCCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAGGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAAAGGGAAAAAAGAGCAATAGGACTTGGAGCTTTCTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTAATGTGCCCTGGAATATTAGTTGGAGCCCTAGATGGAATAGATCTCTAGATGAGATTTGGACTAACATGACCTGGAAGCAGTGGGAAAAGGAAATTGACAATTACACAGACATAATATATAACCTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTGGCATTAGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATTACACAGTGGCTATGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGATAGGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +MK115065.1,tat_exon2,7843,7935,8375,8470,forward,0.4918032786885247,RPSSQPRGDPTGPKEQKKEVERETEAHPRD,RPSSQPRGDPTGPKEQKKEVERETEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAG +MK115065.1,rev_exon2,7844,8119,8376,8651,forward,0.40871934604904625,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE,DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAGGAACAGAAGAAGGAGGTGGAGAGAGAGACAGAGGCACATCCACGAGATTAGTGCATGGATTCTTAGCACTCATCTGGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGCGGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTGAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAAATAAAGAATAG +MK115065.1,nef,8263,8904,8795,9415,forward,0.5339772804571117,MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*,ATGGGTAACAAGTTGTCAAGAGGGCTCAGGGCTGGATGGCCTACCATAAGGGAGAGAATGAGACGAGCTAGGCCAGTAAGAGAGCCAGAGCCAGCAGCAGCTGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTGGAAGCACAACAGGAGGAGGAAGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAGGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAGGGCCAGGAGTCAGATTTCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAGAACCTGCATGGAATGGAGGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA +MK115464.1,gag,527,2296,789,2291,forward,0.706855791962175,MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ,MLQAIPGLRVGPAGSHPFALTSLSASCCHQSQSPGCSGATARTGT*KRK*NQRSSLDAGLGLLKRARQEARGGDW*VRQF*LAEARRREISARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADKGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNA*VKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAE*DRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIA*MTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKN*MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ*,ATGCTTCAGGCCATCCCTGGTTTGAGGGTGGGTCCCGCCGGGTCCCACCCCTTTGCACTCACGAGCCTGTCTGCCTCCTGCTGCCATCAATCACAGAGCCCAGGCTGTTCGGGCGCCACTGCCCGAACAGGGACCTGAAAGCGAAAGTAGAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGAGGCGGCGACTGGTGAGTACGCCAATTTTGACTAGCAGAGGCTAGAAGGAGAGAGATAAGTGCGAGAGCGTCTGTATTAAGCGGGGGAGAATTAGATAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAGAAAAGATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCCGGCCTTTTAGAAACAACAGAAGGATGTAAACAAATACTGGAACAGCTGCAACCATCCCTTCCGACAGGATCAGAAGAACTTAGATCATTATTTAATACAGTAGCAACCCTCTATTGTGTGCATAAGAGAATAGAGGTACAAGACACCAAGGAAGCCTTAGAAAAGATAGAAGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAGGCAGTAGCTGACAAAGGAAGTACCAGCCAGGTCAGCCAAAATTACCCGATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGGCCATATCGCCTAGAACTTTAAATGCATAGGTGAAAGTAGTAGAAGAGAAGGCCTTTAGCCCAGAGGTAATACCCATGTTTTCAGCATTATCGGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAGGCTGCAGAATAAGATAGAGTGCATCCAGTGCATGCAGGGCCTGTTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATAGATGACAAGTAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTAGGATTAAATAAGATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAGTCCTAAGAGCCGAGCAAGCATCACAGGATGTAAAAAATTAGATGACAGAAACCTTATTAGTCCAAAATGCAAACCCAGATTGTAAGACTATTTTAAAAGCATTAAGACCAGCAGCAACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAAATATCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGACTGTTAAGTGTTTCAATTGTGGCAAAGAAAGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAAGGAAGATCTGGCCTTCCTCCAAAGGAAGGCCAAGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTAGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAAGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MK115464.1,pol,2089,5100,2084,5095,forward,0.7518376924488996,AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED,FFKEDLAFLQRKAKELSSEQTRANSPTRRELQV*GGDSNSSSEAGAGGQRSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEISLPGR*KPKMIEGIGGFIKVRQYDQITIEICGHKAIGTVLVGPTPVNIIGRNLLTQISCTLNFPISPIETVPVQLKPGIDSPKVKQWPLTEEKIKALVEICTEMEKEKKISKIRPENPYNTPVFAIKKKDSTK*RKLVDFKELNKRTQDF*EVQLRIPHPARLKKKKSITVLDVGDAYFSIPLDKDFKKYTAFTIPSINNKTPEIRYQYNVLPQG*KRSPAIFQSSMIKILEPFRKQNPDIVIYQYIDDLYVRSDLEIRQHRTKIEELRQHLLK*RLTTPDKKHQKEPPFLWISYELHPDKWTVQPIVLPDKDSWTVNDIQKLVRKLN*ASQIYAEIKVRQLCKLLKGAKALTEVIQLTEEAELELAENKEILKEPVHEVYYDPSKDLIAELQKQRQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVI*GKTPRFKLPIQKET*DT*WTEYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVGAETFYVDRAANKETKLRKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALRIIQAQPDKSESEIVNQIIEQLIKKEKVYLA*VPAHKRIRRNEQVDKLVSARIRKVLFLDRIDKAQEEHKKYHNN*RAMASDFNLPPVVAKKIVASCDKCQLKKEATHRQVDCSPRIWQLDCTHLEGKVILVAVHVASRYIEAEVIPAETGQETAYFLLKLAGR*PVKAIHTDNGTNFTSATVKAAC**AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED*,TTTTTTAAGGAAGATCTGGCCTTCCTCCAAAGGAAGGCCAAGGAACTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTAGGGAGGAGACAGCAACTCCTCCTCAGAAGCAGGAGCCGGTGGACAAAGAAGTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGAGGGCAGCTAAAGGAAGCTCTATTAGATACAGGAGCAGATGACACAGTATTAGAAGAAATAAGTTTGCCAGGAAGATAGAAACCAAAAATGATAGAAGGAATTGGAGGCTTTATCAAAGTAAGACAGTATGATCAGATAACTATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGCAGAAATTTGTTGACTCAGATTAGTTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTACAATTAAAACCAGGAATAGATAGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAAGAAAAAAAGATTTCAAAAATTAGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGAAGAAAATTAGTAGATTTCAAGGAACTTAATAAAAGAACTCAAGACTTCTAAGAAGTTCAATTAAGAATACCACACCCCGCAAGGTTAAAAAAGAAGAAATCAATAACAGTACTAGATGTAGGTGATGCATATTTTTCAATTCCCTTAGATAAAGACTTCAAGAAGTATACTGCATTTACCATACCTAGTATAAATAATAAGACACCAGAGATTAGATATCAGTACAATGTGCTTCCACAGGGATAGAAAAGATCACCAGCAATATTCCAAAGTAGCATGATAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGACATAGTTATCTATCAATACATAGATGACTTGTATGTAAGATCTGACTTAGAAATAAGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACACTTGTTGAAGTAGAGATTGACCACACCAGATAAAAAACATCAGAAAGAACCCCCATTCCTGTGGATAAGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGACAAAGATAGCTGGACTGTCAATGACATACAGAAGCTAGTAAGAAAATTGAATTGAGCAAGTCAGATTTATGCAGAGATTAAAGTGAGACAATTATGTAAACTCCTTAAAGGAGCCAAAGCGCTAACAGAAGTGATACAACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAAAGAAATTCTAAAAGAACCAGTACATGAAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAGTTACAGAAGCAGAGGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAACGAGAGGTACCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTGATATGAGGAAAGACCCCTAGATTTAAACTACCCATACAGAAAGAAACATAAGATACCTAGTGGACAGAATATTGGCAAGCCACCTAGATTCCCGAGTAAGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATAGTACCAATTAGAAAAAGAGCCTATTGTAGGAGCAGAAACTTTCTATGTAGATAGGGCAGCTAATAAAGAGACTAAATTAAGAAAAGCAGGATATGTTACTAGCAGAGGAAGACAAAAGGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAACTGCAAGCAATTTGTCTAGCATTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCACTAAGAATAATTCAAGCACAACCAGATAAGAGTGAATCAGAGATAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTACCTTGCATAGGTACCAGCACACAAAAGAATTAGAAGAAATGAACAAGTAGATAAATTAGTCAGTGCTAGAATCAGGAAAGTCCTATTTTTAGATAGAATAGATAAGGCCCAAGAAGAGCATAAGAAATATCACAATAATTAAAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAAAAATAGTAGCCAGTTGTGATAAATGCCAGCTAAAAAAAGAAGCCACGCATAGACAAGTAGACTGTAGTCCAAGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAGTTATCCTAGTAGCAGTTCATGTAGCCAGTAGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTCCTCTTAAAATTAGCAGGAAGGTAGCCAGTGAAAGCAATACATACAGACAATGGAACCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTAGTAGGCAAAGATCAAGCAGGAATGTGGCATTCCCTACAATCCCCAAAGTCAAGAAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAAGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTCCAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAACAGAGATCCACTTTGGAAAGGACCAGCAAAACTTCTTTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAAGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115464.1,vif,5045,5623,5040,5618,forward,0.7067546928117459,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY,MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY*GLHTGERDWHLGQGVSIEWKERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRRSQTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGCACATGGAAAAGTTTAGTAAAACACCATATGTACATTTCAAAGAAAGCCCAAGGATGGTTTTATAGACATCACTATGAAAATCCTCATCCAAGAATAAGTTCAGAAGTACACATCCCGCTAGGGGATGCTAGATTGGTAATAACAACATATTAGGGTCTGCATACAGGAGAAAGAGACTGGCATTTAGGTCAAGGAGTCTCCATAGAATGGAAGGAAAGGAAATATAGCACACAAGTAACCCCTGACCTAGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTGCAGAATCTGCTATAAGAGAGGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAACAGCATTAGTAACACCAAAAAAGACAAAGCCACCTTTGCCTAGTGTGACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAG +MK115464.1,vpr,5563,5853,5558,5848,forward,0.37688442211055273,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTAGGACAACATATCTATGAAACTTATGAGGATACTTGGACAGGAGTAGGAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTAGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAG +MK115464.1,tat_exon1,5563,6051,5829,6044,forward,0.7571801566579635,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS,MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS*IRALEASRKSA*DSLYQMLL*KMLLSLPSLFHNKRLRHLLWQEEAETATKTSSRQSDSSSTSTKAV,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAAGGAGCCAAACAATGAATGGACACTAGAGCTCTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTTCCTAGGACATGGCTTCATGGCTTAGGACAACATATCTATGAAACTTATGAGGATACTTGGACAGGAGTAGGAGCCTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTAGGTGCCAACATAGCAGAATAGGCATCACTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAAATGCTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTG +MK115464.1,rev_exon1,5973,6050,5968,6045,forward,0.4267425320056898,MAGRSGDSDEDLLKTVRLIKYLYQSS,MAGRSGDSDEDLLKTVRLIKYLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGT +MK115464.1,vpu,6065,6310,6060,6308,forward,0.7521692502681095,MQSLYILTIVALVVAAILAIVV,MQSLYILTIVALVVAAILAIVV*AIVLIEYKKILKQRRIDRLIDRIIDKAEDSGNESEGDQEELSAFVEIGHHAP*NVDDL*,ATGCAATCTTTATATATATTAACAATAGTAGCATTAGTAGTAGCAGCAATATTAGCAATAGTTGTGTAGGCCATAGTACTCATAGAATATAAGAAAATATTAAAACAAAGGAGAATAGATAGGTTAATTGATAGAATAATAGATAAGGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAGGGCATCATGCTCCTTAGAATGTTGATGATCTATAG +MK115464.1,env,6228,8798,6223,8793,forward,0.7471048806788873,MTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST,MRVKEIKRSYQHL*R*GIMLLRMLMIYSTADQWWVTVYYKVPVWREANTTLFCASDAKAYSTEAHNV*ATHACVPTDPNPQEIVIENVTEDFNMWKNNMVDQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTSNTT*GEMTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST*TKNGTDSWQSNDTQNSNITLQCRIKQIINLWQEVRKAMYAPPISRQINCTSNITGLVLTRDRRNETKTFRPGRENMKDNWRSKLYKYKVVRIEPLRIAPTKAKRRVVQREKRAVRLGAMFLKFLGAARSTIGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLAVERYLQDQQLLGL*GCSRKLICTTTVP*NRS*GRHNKNYKSLDDI*DNMT*IE*EKEIDNYTSLIYTLITESHSQQKKNEQELLALDK*ASL*N*FDISQWLWYIKIFIMIVGGLVSLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPERIEERGRERDKGRSGRLVNGFLALI*DDLRSLCLFSYHRLSDLLLIVIKIVELLRRKR*EALKY**NLLQY*SQELKNSAVSLLNTTAIVVAERTDKIIEILQRISRAFLHIPRRIRQGLEKALL*,ATGAGAGTGAAGGAGATCAAGAGGAGTTATCAGCATTTGTAGAGATAGGGCATCATGCTCCTTAGAATGTTGATGATCTATAGTACTGCAGACCAGTGGTGGGTCACAGTCTATTATAAGGTACCTGTGTGGAGAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGCACATAATGTTTAGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATAGTAATAGAAAATGTAACAGAAGATTTTAACATGTGGAAGAATAACATGGTAGATCAGATGCATGAGGATATAATCAGTTTATAGGATCAAAGTCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGTACTGATATTAGGAATAGTACCGTTACTTCTAATACTACTTCTAATACTACTTAGGGAGAAATGACAAACTGCACTTTCAATATCACCACAAGCATAAAGGATAAGATAAAAAAAGAAGCGGCACTTTTTTATAAAATTGATTTAGTAGAAATAGATGAAAAGAAAAATAACAGTAGTACCAGATATAGGTTGATAAATTGTAACACCTCAGCCATTACACAAGCCTGCCCAAAGGTATCCTTTAAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCAATTCTAAAGTGTAATAATAAGAAGTTCAGTGGAAAAGGACCATGTACAAATGTCAGCACAGTGCAATGTACACATAGAATTAAGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAATGATTAGATCTGACAATATCACAGACAATACTAAAAACATAATAGTACAGTTGAAAGAAGCCATACGAATTTTCTGTATAAGACCCAACAACAATACAAGAAAAAGTATAAATATAAGACCAGGAAGAGCATTTTATACAACAGGAGATATAATAAGAGACATAAGGCAAGCACATTGTAACATTAGTGGAAATTGGAGTAACACTTTAAAACAGATAGCTACACAATTAGGAAAACAACTGAATCAAACACAACAAATAATCTTTAATTCATCCGCAGGAAAGGACCCAGAGATTGTAACACACAGTTTTAATTGTGGAAAGAAATTCTTCTATTGTAATTCATCATCACTGTTTAATAGTACCTAGACTAAAAATGGTACTGATAGTTGGCAGTCTAATGATACTCAGAATAGTAATATCACACTCCAATGCAGAATAAAACAAATTATAAACCTGTGGCAGGAAGTAAGAAAAGCAATGTATGCCCCTCCCATCAGTAGACAAATTAACTGTACATCAAATATTACAGGGCTAGTTTTAACAAGAGATAGGAGGAATGAAACTAAGACCTTTAGACCTGGAAGAGAAAATATGAAGGATAATTGGAGAAGTAAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAAGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAGAGAGAGAAAAGAGCAGTAAGACTAGGAGCTATGTTCCTTAAGTTCTTAGGAGCAGCCAGAAGCACTATAGGCGCAGCGTCGATAGCGCTGACGGAACAGGCCAGACGAGTCTTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATTTGTTGCAACTCACAGTCTAAGGCATTAAGCAGCTCCAGGCAAGAGTCCTGGCTGTAGAAAGATACCTACAGGATCAACAGCTCCTAGGACTTTGAGGTTGCTCTAGAAAACTCATTTGCACCACTACTGTGCCTTAGAATCGTAGTTGAGGTAGGCATAACAAAAATTACAAAAGTCTAGATGACATTTAGGATAACATGACCTAGATAGAGTAGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTACAGAATCACATTCCCAACAAAAAAAGAATGAACAAGAATTATTGGCATTAGATAAATAGGCAAGTTTGTAGAATTAGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAAGGACAGATAAGATAATAGAAATATTACAAAGAATTAGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAA +MK115464.1,nef,8194,9450,8795,9415,forward,0.6514772974147296,MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC,MNKNYWH*INRQVCRISLTYHNGCGI*KYS****EA**V*E*FLLYFL**IKLGKDTHHYHFRPSSQPREEPTGPKE*KKEVERETKADPVD**TDS*HLSRTIYGAYASSATTA*ATYS*L*SRLWNF*DARGKKPSNISRISCSTRVRN*RIVLSACSTPQL***LKGQIR**KYYKELVELFSTYLGE*DRA*KRLCYKIGGKWSKSSKVK*NAVKERIRRAQPTADKERAEPAADKVRAASRDLEKYGALTSKNTAATNADCAWLEAQEEEDEVGFPVRPQLPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC*,ATGAACAAGAATTATTGGCATTAGATAAATAGGCAAGTTTGTAGAATTAGTTTGACATATCACAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAAGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAAAGTTAGGCAAGGATACTCACCATTATCATTTCAGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACACCACAGCTATAGTAGTAGCTGAAAGGACAGATAAGATAATAGAAATATTACAAAGAATTAGTAGAGCTTTTCTCCACATACCTAGGAGAATAAGACAGGGCTTAGAAAAGGCTTTGCTATAAGATAGGTGGCAAGTGGTCAAAAAGTAGTAAGGTTAAATAGAATGCAGTGAAAGAAAGAATAAGACGAGCTCAGCCAACAGCAGATAAAGAACGAGCTGAGCCAGCAGCAGATAAGGTAAGAGCAGCATCTAGAGACCTAGAAAAATATGGAGCACTTACAAGTAAGAATACAGCAGCTACTAATGCTGATTGTGCCTGGCTAGAAGCACAAGAAGAGGAGGATGAGGTAGGTTTTCCAGTCAGACCTCAGTTACCTTTAAGACCCATGACTTATAAAGCAGCTCTAGATCTGAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAGTTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTATTTCCCTGATTGGCAGAACTACACACCAGGGCCAAGGATCAGATATCCCCTGACCTTTGGATGGTGCTTCAAGCTAGTACCACTTGAGCCAGATCAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCCTGTTACACCCTCTGAGCCAGCATAGGATGGATGACCCGGAGAAAGAAGTGCTAGTGTGGAGATTTGACAGCCGCCTCGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTTCTACAAAGACTGCTGA +MK115464.1,tat_exon2,8380,8475,8375,8470,forward,0.6995153473344102,RPSSQPREEPTGPKE,RPSSQPREEPTGPKE*KKEVERETKADPVD**,AGACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGA +MK115464.1,rev_exon2,8381,8656,8376,8651,forward,0.5716671727907683,RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE,DPPPSPERSRQARKNRRKR*RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE*,GACCCTCCTCCCAGCCCCGAGAGGAGCCGACAGGCCCGAAAGAATAGAAGAAAGAGGTAGAGAGAGAGACAAAGGCAGATCCGGTCGATTAGTGAACGGATTCTTAGCACTTATCTAGGACGATCTACGGAGCCTATGCCTCTTCAGCTACCACCGCTTGAGCGACTTACTCTTGATTGTGATCAAGATTGTGGAACTTCTAAGACGCAAGAGGTAAGAAGCCCTCAAATATTAGTAGAATCTCCTGCAGTACTAGAGTCAGGAACTAAAGAATAG +MK115530.1,gag,746,2245,789,2291,forward,0.3014827756125966,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115530.1,pol,2038,5049,2084,5095,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115530.1,vif,4994,5572,5040,5618,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115530.1,vpr,5512,5802,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115530.1,tat_exon1,5783,6001,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115530.1,rev_exon1,5922,5999,5968,6045,forward,0.4267425320056898,MAGRSGDSDEELLKAVRLIKILYQSS,MAGRSGDSDEELLKAVRLIKILYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +MK115530.1,vpu,6014,6259,6060,6308,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115530.1,env,6177,8717,6223,8793,forward,0.46021436825118545,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115530.1,tat_exon2,8299,8394,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115530.1,rev_exon2,8300,8575,8376,8651,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115530.1,nef,8719,9333,8795,9415,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115520.1,gag,695,2194,789,2291,forward,0.3014827756125966,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115520.1,pol,1986,5003,2084,5095,forward,0.6033592883813991,YGKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,IF*GKSGLPTKEGQGTSFRADQSQQPHQKRASGLGKRQ*LPLRSRSQETRNCIPCLPSNHSLAATPRQNKNRGAI*RSFLRYRSR*YSIRRNEFARKMETKNDRGNWRFYQSKTV*SDTHRNLWTQSYRYSINRTYTCQHNWKKSVDSAWLYLKFSH*SY*NCTSKIKARNGWPKS*TMAIDRRKNKSISRNLYRNGKGRKNFKNWA*KSIQYSSICYKEKRQY*MEKISRFQRTQ*ENSRLLGSSIRNTTSCRVKKEKISNSTGCG*CIFFNSLR*RIQEVYCIYHT*YK**DTRD*V*VQCAATGMERITSNIPK*HDKNLRAF*KAKSRYSYLSIHG*FVCRI*LRNRAA*NKNRGTKTTSVKVGTYHTRQKTSERTSIPLDGL*TPS*YGKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,ATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAAATAGGGGGGCAATTTAAAGAAGCTTTCTTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTAAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATATGGGAAATGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115520.1,vif,4948,5526,5040,5618,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115520.1,vpr,5466,5756,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115520.1,tat_exon1,5737,5955,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115520.1,rev_exon1,5876,5956,5968,6045,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115520.1,vpu,5968,6213,6060,6308,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115520.1,env,6131,8671,6223,8793,forward,0.4585964351370794,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAGATAAGATGCAGAAAGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAAATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGGATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTTAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115520.1,tat_exon2,8253,8348,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115520.1,rev_exon2,8254,8529,8376,8651,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115520.1,nef,8673,9287,8795,9415,forward,0.4690990320178705,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAATGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGATACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTGCACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115503.1,gag,817,2316,789,2291,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115503.1,pol,2109,5120,2084,5095,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115503.1,vif,5065,5643,5040,5618,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115503.1,vpr,5583,5873,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115503.1,tat_exon1,5854,6072,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA +MK115503.1,rev_exon1,5993,6073,5968,6045,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115503.1,vpu,6085,6330,6060,6308,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115503.1,env,6248,8788,6223,8793,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115503.1,tat_exon2,8370,8465,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115503.1,rev_exon2,8371,8646,8376,8651,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115503.1,nef,8790,9404,8795,9415,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115570.1,gag,687,2186,789,2291,forward,0.2967573174581697,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCGACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115570.1,pol,1979,4990,2084,5095,forward,0.19298018391400085,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115570.1,vif,4935,5513,5040,5618,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115570.1,vpr,5453,5743,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115570.1,tat_exon1,5724,5939,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG +MK115570.1,rev_exon1,5863,5943,5968,6045,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115570.1,vpu,5955,6200,6060,6308,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115570.1,env,6118,8658,6223,8793,forward,0.4620723847297967,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCTCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAAGGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115570.1,tat_exon2,8240,8335,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115570.1,rev_exon2,8241,8516,8376,8651,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115570.1,nef,8660,9274,8795,9415,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115509.1,gag,555,2054,789,2291,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115509.1,pol,1847,4858,2084,5095,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115509.1,vif,4803,5381,5040,5618,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115509.1,vpr,5321,5611,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115509.1,tat_exon1,5592,5807,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG +MK115509.1,rev_exon1,5731,5811,5968,6045,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115509.1,vpu,5823,6068,6060,6308,forward,0.5399181166837258,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115509.1,env,5986,8526,6223,8793,forward,0.4581222593756883,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115509.1,tat_exon2,8108,8203,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115509.1,rev_exon2,8109,8384,8376,8651,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115509.1,nef,8528,9142,8795,9415,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115702.1,gag,246,1781,789,2291,forward,0.35613851839948674,MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ,MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ*SQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGCGGCGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAGGAAACGATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGCTTCGCAGTCAACCCTGGCCTGTTAGAAACATCAGAAGGCTGCAAACAAATAATGGGACAACTCCAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAGTCCTCTATTGTGTACATCAGAGGATAGATGTAAAGGATACCAAAGAAGCTTTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGACACAGCAAGCAGCAGCCGCTGACACAGGAAACAACAGCCAAGTCAGCCAAAATTACCCCATAGTGCAGAACATGCAGGGACAAATGGTACATCAGGCCATATCACCCAGAACCCTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCATTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAGGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAGGCTGCAGAATGGGATAGAGTGCATCCAGTGCAGGCAGGACCTGTTGCACCAGGCCAGATAAGGGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACACATAATCCACCCGTCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGACTAAATAAAATAGTAAGGATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAGACTCTAAGAGCTGAGCAAGCTTCACAGGAAGTAAAAGGTTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACCATTTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCAGCCATAAGGCAAGGGTTTTGGCAGAAGCAATGAGCCAAGCAACAGGTGCACATGCCATAATGATGCAGAGAGGCAATTTTAAGAACCAAAGAAAGACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGACTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCCTCAGGCCAACAGCCCCACCAGTAGAGAGCTTCAGGTTTGGGGAAGAGACAGCAGCCCCCTTTCAGAAGCAGGAACCGAGAGACAAGGAGATGTCTCCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCAGTAGTCACAATAA +MK115702.1,pol,1544,4585,2084,5095,forward,0.24526399193257942,FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAGGAGAGCCTCAGGCCAACAGCCCCACCAGTAGAGAGCTTCAGGTTTGGGGAAGAGACAGCAGCCCCCTTTCAGAAGCAGGAACCGAGAGACAAGGAGATGTCTCCCTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCAGTAGTCACAATAAAGATAGGGGGGCAAATAAAGGAAGCTCTATTAGACACAGGAGCAGATGATACAGTATTAGAAGAAATGGCGTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATAGCCATAGAAATTTGTGGACATAAAGCAATTGGTACAGTATTAGTAGGACCTACACCTGTCAATATAATTGGAAGAAATCTATTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAGTTAAAGCCAGGAATGGATGGCCCAAAAATTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATAGGGCCTGAAAATCCATACAATACTCCAATATTTGCCATAAAGAAAAAAGACAGTACTAAGTGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGATTAAAAAAGAAAAAATCAATAACAGTACTGGATGTGGGTGATGCCTATTTTTCAGTTCCCTTAGATGAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGCATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATATTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGACGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTAAGAGGACATCTGTTGAAGTGGGGGTTTACCACACCAGACAAAAAACATCAGAAGGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAGATGGACAGTACAGCCTATAAAGCTGCCAGAGAAAGAAATCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAACTGGGCAAGTCAGATTTACCCAGGAATTAAAGTAAAACAATTATGTAAACTCCTTAGGGGAACCAAAGCATTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGAGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGAATTAATAGCAGAAATACAGAAGCAAGGGCAAGGCCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCGAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAGAAAATATCTACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAGGAAACATGGGAAATATGGTGGACAGACTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTTAGTACTCCTCCCCTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCATCTAATAGGGAGACTAAATTAGGAAAAGCAGGATATATTACTGACAGAGGAAGACAAAAGGTTGTCACCCTAAATGACACAACCAATCAAAAGACAGAGTTACAAGCAATTCTTCTAGCATTGCAGGATTCAGGATTAGAAGCAAACATAGTGACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGATCTACCTGACATGGGTACCAGCACATAAAGGAATTGGAGGAAATGAGCAAGTAGATAAATTAGTCAGTACTGGGATTAGGAAAGTATTATTTTTAGATGGAATAGATAGGGCCCAAGAAGAGCATGAGAGATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTCAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGACAAATAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACACTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTACCACAGTTAAGGCCGCCTGTTGGTGGGCGGGGGTCAAGCAGGAATTTGGTATTCCCTACAATCCCCAGAGTCAAGGAGTGGTAGAATCTATGAATAAAGAATTAAAGAAAATAATAGGACAGGTCAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTTCAAAAATTCAAAACTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCGGTAGTAATACAGGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115702.1,vif,4530,5108,5040,5618,forward,0.3566796368352788,MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGTATGTTTCAAAGAAAACTAAGGGATGGTTTTATAGACATCACTATGAGAGCACTCATCCAAAAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTGAGTTGGTAGTAACAACATATTGGGGTTTGCAGCCAGGGGAAAGGGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAGGGAGATATAGAACACACGTGGACCCTAACCTAGCAGACCAACTAATTCATCTGCATTACTTTGATTGTTTTTCAGAATCTGCTATAAGACATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAAGAGCACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACTAAACTAACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG +MK115702.1,vpr,5048,5338,5558,5848,forward,0.3566796368352788,MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS,MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAACTTAAGCAGGAAGCTGTTAGGCATTTTCCTAGGCCATGGCTTCATAGCTTAGGGCAATATATCTATGAAACTTATGGGGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATGCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATCCCACAGAGGAGAGCAAGAAATGGATCCAGTAGATCCTAA +MK115702.1,tat_exon1,5319,5534,5829,6044,forward,0.5237430167597767,MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ,MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ,ATGGATCCAGTAGATCCTAACCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTAACAATTGCTATTGTAAAAAGTGTTGCCTTCATTGCCAAGTTTGTTTCACACGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAG +MK115702.1,rev_exon1,5458,5538,5968,6045,forward,0.5622384937238494,MAGRSGDGDEDLLKAVRLIKTLYQSSK,MAGRSGDGDEDLLKAVRLIKTLYQSSK,ATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAGTAAG +MK115702.1,vpu,5550,5807,6060,6308,forward,0.6039004707464695,MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND,MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND**,ATGTTATCTTTAGAAGTAATAGTAGCAATAACAGCATTAGTAGTAGCAGGAATAATAGCAATAGTTGTGTGGACCATAGTACTTATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAAGATACTTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAGGGGGATCAGGAAGAATTGTCAGCGCTTGTGGAGATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAA +MK115702.1,env,5716,8256,6223,8793,forward,0.5196110433453024,MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE,MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE*DRA*,ATGAGAGTGAGGGGGATCAGGAAGAATTGTCAGCGCTTGTGGAGATGGGGCACAATGCTCACCATGCTCCTTGGGATATTAATGATTAGTAATGCTACAGAACAATTGTGGGTCACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAACAACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAATGGTATTAATAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGATCAAATGCAAGAGGACATAGTCAGCTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACCTTAAATTGCACTAATTTGACCATTGAGCCAAACAATGCTACTAAAGCCAATATTAGTGGGAGGTTAGAGGGGAAAGGAGAAATGACAAACTGCTCTTTCAATGTCACCACAAGCCTAAGAGATAAGAGGAAGAAAGAATATGCACTCTTTTATAAACTTGATGTAGTAGCAACAGGTGAAAATAATAACAGCTTTAGGTTGATAAGTTGTAATACCTCAGAGATTACACAGGCCTGTCCAAAGGTATCATTTGAACCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATGATAAAAAGTTCAATGGAACAGGAAAATGTAACAATGTCAGCATAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAGTAGTTAGATCTGCCAATTTCTCAGACAATACTAAGACCATAATAGTACAGCTGAACAAAACTGTAGTAATTAATTGTACAAGACCCAACAACAATACAAGGAGAAGTATACATATAGCACCAGGGAGAGCATTTTATGCAACAGGAGATATAATAGGAGATATAAGAAAAGCACATTGTAACATTAGTAAAGAAGATTGGAATACCACTTTAAACCAGGTGGCTAAAAAATTACAAGAACAATTTGAGAATGCAACAATAGACTTTAAACCATCCTCAGGAGGGGACCCAGAAATTGTAATGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACGGAACTATTTTCTTGGAATGCTACAACAAAACTGTTTACTTGGAATGCTACAAATAGCAATAATGGAACCATCATACTCCCATGTAGAATAAAACAAATTATAAACATGTGGCAAGAGGTAGGAAAAGCAATGTATGCCCCTCCCATTCGTGGACAAATTAGATGTTCGTCAAATATTACAGGACTGCTATTAACAAGAGATGGTGGGACTAACGGGACAGGGAACAGGAATGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAGAAATTAAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGACCATAGGAGCTATGTTCCTTGGGTTCCTGGGGGCAGCAGGAAGCACTATGGGCGCAGCATCACTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCGATTGAGGCGCAGCAGCATCTGTTGCAACTCACAGTCTGGGGCATAAAACAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGGTACCTAAGAGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAATATTAGTTGGAGTAATAGAACTCTGAATAACATTTGGGACAATTTGACTTGGATGCAGTGGGATACAGAAATTAACAATTACACAAACAAAATATACCAATTACTTGAGGAAGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAATTTGTGGAATTGGTTTGACATATCAAACTGGCTGTGGTACATAAAAATATTCATATTAATAGTAGGAGGCTTAATAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGAACGGATTCTTGACACTTATCTGGGTCGATCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTCAAATATTGGTGGAATGTCCTGCAATATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTAAATGCCACAGCCATAGTAGTAGCTGAGGGGACAGATAGGATTATAGAATTAGCACAAAGAATTTGTAGAGCAGAATAAGACAGGGCTTGA +MK115702.1,tat_exon2,7874,7969,8375,8470,forward,0.32608695652173914,RPASQSRGDPTGPKEPKKKVERETETDPTD,RPASQSRGDPTGPKEPKKKVERETETDPTD**,AGACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGA +MK115702.1,rev_exon2,7875,8150,8376,8651,forward,0.3471418653089562,DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE*,GACCCGCTTCCCAGTCCCGAGGGGACCCGACAGGCCCGAAGGAACCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGACAGATTAGTGAACGGATTCTTGACACTTATCTGGGTCGATCTGAGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCACTCAAATATTGGTGGAATGTCCTGCAATATTGGAGTCAGGAACTAAAGAATAG +MK115702.1,nef,8275,8895,8795,9415,forward,0.4680383864671438,MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC,MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC*,ATGGGTGGCAAGTGGTCAAAACATAGTAAGAGTGAATGGGCTGATGTAAGGGAAAGAATGGCACAAACTGAGGCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGATCTGGAAAGACATGGAGCAATCACAAGTAGCAATACAGCAACTAACAATGCTGCTTGTGCTTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCAAACCTCAGGTGCCTTTGAGACCAATGACCTACAAGGGAGCTTTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTATTCCCAAAAAAGACAAGACATCCTTGATCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGAACCAGATTCCCACTGTGCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTGGAAGAAGCCAATAAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACACCGAGAGAGAGGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACGTAGCCAGAGAGAAACATCCGGAGTACTTCAAGGACTGCTGA +MK115095.1,gag,2,1696,789,2291,forward,0.7478034493979825,MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC,SGFSFTFKSLFGRHLGDLKAKEKPEELSRRRTRLAERARQEARRGD**VRRNF*LAEARRREIGARASVLSGGELDR*EKIYLRPGRKKKYRLKHIVWASRELERFAVNPGLLKSSEGCRQILGQLQPALQTGSEELRSLYNTIAVLYCVHQKINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQIVHQPISPRTLNA*VKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVRRHQAAMQMLKETINDEAAE*DRLHPVHAGPIAPGQMKEPRRSDIAGTTSTLQEQIR*MTNNPPIPVGEIYKR*IILRLNKIVKMYSPVSILDIRQRPKEPFKDYVDRFYKTLKAEQASQDVKN*MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC*KCGKKGHQMKDCTKRQANFLRKIWPSHKGRPKNFLQSRPEPTAPPAESFRFKEEATAPPQKQETKDQELYPLASLRSLFGNDP*YQ*,TCTGGTTTCTCTTTCACTTTCAAGTCCCTGTTCGGGCGCCATCTAGGGGACCTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCACGGCAAGAGGCGAGGCGCGGCGACTAGTGAGTACGCCGAAATTTTTGACTAGCAGAGGCTAGAAGGAGAGAGATAGGTGCGAGAGCGTCAGTATTAAGCGGCGGAGAATTAGATAGATAGGAAAAAATTTACCTAAGGCCAGGGAGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTCAACCCTGGCCTGTTAAAGTCATCAGAAGGCTGCAGGCAAATTCTAGGACAGCTACAACCAGCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAGATAAATGTAAAAGACACCAAAGAAGCTCTAGACAAAATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAACAAGCAGCAGCTGACACAGGAAACAGCAGCAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTACAAGGGCAAATAGTACATCAACCCATATCACCTAGAACTTTAAATGCATAGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCACTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGAGAAGACATCAAGCAGCCATGCAGATGTTAAAAGAAACCATCAATGATGAAGCTGCAGAATAAGATAGATTGCATCCAGTGCATGCAGGCCCTATTGCACCAGGCCAGATGAAGGAACCAAGAAGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAAGATAGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATAGATAATCCTGAGGTTAAATAAAATAGTAAAAATGTATAGCCCTGTCAGCATTTTGGACATAAGACAAAGACCAAAGGAACCCTTTAAGGATTATGTAGACCGGTTCTATAAAACTCTAAAGGCTGAACAAGCGTCACAGGATGTAAAAAATTAGATGACAGAAACCTTGTTAGTCCAAAATGCGAATCCAGATTGTAAGACCATTTTAAAAGCATTAAGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGAGGACCCGGCCACAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAAGTCAGCCTCCATAATGGTGCAAGGAGGCAATTTAAAGAACCAAAGAAAGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGACACACAGCCAAAAATTGCAGGGCCCCTAAGAAAAAAGGCTGTTAGAAATGTGGAAAGAAAGGACACCAAATGAAAGATTGTACTAAGAGACAGGCTAATTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAAAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTAAGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAA +MK115095.1,pol,1489,4500,2084,5095,forward,0.7624366800883231,KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK,FFKEDLAFPQGKAKEFSPEQTRANSPASRELQV*GRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIRRQLKEALLDTGADDTVLKEINLPGK*KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK*RKLVDFRELNKRTQDF*KVQLRIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPRVRYQYNVLPQR*KGSPAIFQSSMTKILEPFRKENPDIVIYQYIDDLYVRSDLEIEQHRTKIEELRQHLLK*RLTTPDKKHQKEPPFL*ISYELHPNKWTVQPIQLPDKDS*TVNDIQKLVRKLN*ASQIYPEIKVKQLCKLLRRTKALTEVVPLTEEAELELAENKEILKEPVHRAYYDPSKDLIAEVQKQGGDQWTYQIYQKPFKNLKTKKYARTRGAHTNDVKQLTEAVQKIALEAIVI*RKTPKFKLPIQKET*EM**TEYWQAT*IPE*EFVNTPPLVKL*YQLEKEPIVRAETFYVDRAANRETKLRKARYVTDRRRQKVVSLIDTTNQRTKLHAIHLALQDSGSTVNIVTDSQYALKIIQAQPDKSESELVSQIIEQLIKKEKIYLA*VPAHKRIRRNEQVDKLVSSRIRKVLFLDRIDKAQEEHEKYHSN*RAMASDFNLPPVVAKEIVASCDKCQLKREPMHGQVDCSPGIWQLDCTHLERKIILVAVHVASRYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAAC**ARIKQKFSIPYNPQSQGVVESMNNELKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKRGIGGYSAEERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLL*KGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED*,TTTTTTAAGGAAGATTTGGCCTTCCCACAAGGGAAGGCCAAAGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCGCCAGCAGAGAGCTTCAGGTTTAAGGAAGAGGCAACAGCTCCCCCTCAGAAGCAGGAGACGAAGGACCAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCATAATATCAATAAAAATAAGAAGGCAACTAAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAAAAGAAATAAATTTGCCAGGAAAATAGAAACCAAAAATAATAGAAGGAATTAGAGGTTTTATCAAAGTAAGACAGTATGATCAGGTACCCATAAAAATTTGTAGACATAAAGCTATAAGTACAGTATTAATAAGACCTACACCAGTCAACATAATTAGAAGAAATCTGTTGACCCAGCTTAGTTGCACTTTAAATTTTCCCATCAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATAGATAGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAGGCATTAATAGAAATTTGTGCAGAAATAGAAAAAGAAAGGAAAATTACAAAAATTAGGCCTAAGAATCCATATAATACTCCAGTGTTTGCCATAAAGAAAAAAGACAGTACTAAATAGAGAAAATTAGTAGATTTCCGAGAACTTAATAAAAGAACACAAGACTTTTAAAAAGTTCAACTAAGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTAGGTGATGCATATTTTTCAGTTCCTTTAGACAAAGACTTCAGAAAGTATACTGCATTTACCATACCCAGTATAAACAATGAGGCACCAAGAGTTAGATATCAGTACAATGTGCTTCCACAAAGATAGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAAGAAAATCCAGACATAGTTATCTATCAATACATAGATGATTTGTATGTAAGATCTGACTTAGAAATAGAGCAGCACAGAACAAAAATAGAAGAACTGAGACAACATCTGTTAAAGTAAAGACTCACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTTCTTTAGATAAGTTATGAACTCCATCCTAATAAATGGACAGTACAGCCTATACAGCTGCCAGACAAAGACAGCTAGACTGTCAATGACATACAGAAGTTAGTAAGAAAGTTAAATTAGGCAAGCCAGATCTATCCAGAGATTAAAGTAAAGCAATTATGTAAACTCCTTAGAAGAACCAAAGCACTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAAGGAGATTCTAAAAGAACCAGTACATAGAGCATATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGAGGAGACCAATGGACATATCAAATTTATCAGAAGCCATTTAAAAATCTGAAAACAAAGAAATATGCAAGAACGAGAGGTGCCCACACTAATGATGTAAAACAGTTAACAGAGGCAGTGCAAAAAATAGCCCTAGAAGCCATAGTAATATAGAGAAAGACTCCTAAATTTAAACTACCTATACAAAAAGAAACATAAGAAATGTAGTAGACAGAGTATTGGCAAGCCACCTAGATTCCTGAGTAGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATAGTACCAGTTAGAGAAAGAACCCATAGTAAGAGCAGAAACTTTCTATGTAGATAGGGCAGCTAATAGAGAGACTAAATTAAGAAAAGCAAGGTATGTTACGGACAGAAGAAGACAAAAAGTTGTCTCCCTAATAGACACAACAAATCAGAGGACTAAGTTACACGCAATTCATCTAGCTTTGCAGGATTCAGGATCAACAGTAAACATAGTGACAGACTCACAATATGCCTTAAAGATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGCTAATAAAAAAAGAAAAAATTTACCTGGCATAAGTCCCAGCACACAAAAGAATTAGAAGAAATGAACAAGTAGATAAATTAGTCAGTAGTAGAATCAGAAAAGTACTATTTCTAGATAGAATAGATAAAGCCCAAGAAGAACATGAAAAATATCACAGTAATTAAAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGTTAAAAAGAGAACCTATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAAGAAAAATTATCCTAGTAGCAGTTCATGTAGCCAGTAGATACATAGAAGCAGAAGTTATTGCAGCAGAAACAGGGCAGGAAACAGCATACTTTATCTTAAAATTGGCAGGAAGATGGCCAGTAAAAATAATACATACAGACAATGGCAGCAATTTCACCAGCACTACAGTTAAGGCCGCCTGTTAGTAGGCAAGGATCAAGCAGAAATTTAGTATTCCCTACAATCCTCAAAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAAAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAAGGGGGATTGGGGGGTACAGTGCAGAGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAACTACAAAAACAAATTTCAAAAATTCAAAATTTTCAGGTTTATTACAGGGACAGCAGAGAACCACTTTGGAAAGGACCAGCAAAGCTCCTCTAGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCCTTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAAGATGAGGATTAG +MK115095.1,vif,4445,5023,5040,5618,forward,0.7494633160752622,MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR,MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR*VYRHHHESHNPKTSSEVHIPLREARLVIKTY*GLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVRPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKRSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAAGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATATTTCAAAGAAAGCTCAGAGATGAGTTTACAGACATCACCATGAAAGCCATAATCCAAAAACAAGTTCAGAAGTACACATCCCATTAAGGGAAGCAAGATTAGTAATAAAAACATATTAAGGTCTGCATACAGGAGAAAGAGACTGGCATTTAGGCCAGGGAGTATCCATAGAATGGAGGAAAAAGAGATATAGCACACAAGTAGACCCTGGCCTGGCAGACCAACTAATTCACCTGTATTATTTTGATTGTTTTTCAGAATCTGCTATAAGGAATGCCATATTAGGACATAGAGTTAGGCCTAGGTGTGAATATCAGGCAGGACATAACAAGGTAGGATCCCTACAATACTTGGCATTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCCAGTGTTACAAAATTAACAGAGGACAGATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATGAATGGACATTAG +MK115095.1,vpr,4963,5253,5558,5848,forward,0.4464285714285715,MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS,MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS*,ATGGAACAAGTCCCAGAGGACCAAAGGCCACAAAAGGAGCCATACAATGAATGGACATTAGAGCTCTTAGAAGAACTTAAGAGTGAAGCTGTTAGGCATTTTCCTAGACCATGGCTTCATAGCTTAGGACAATATATCTATGAAACTTATGGAGATACTTGGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAAGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAA +MK115095.1,tat_exon1,5111,5452,5829,6044,forward,0.6409453748630458,MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ,MEILGQR*KP**EPCNNCCSFISELGVNIAG*ELFDRGEQEIEPVDPNLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ*,ATGGAGATACTTGGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAAGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAACTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAAGAAAAGGCTTAGGCATCTCCCATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA +MK115095.1,rev_exon1,5373,5450,5968,6045,forward,0.4886988393402566,MAGRSGDSDEELLTAVRIIKRLYQSS,MAGRSGDSDEELLTAVRIIKRLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT +MK115095.1,vpu,5465,5710,6060,6308,forward,0.7521692502681095,MHALEIAAIVRLVVAAIIAIVV,MHALEIAAIVRLVVAAIIAIVV*SIVLIEYKKILRQKKIDRLIDRIRERAEDSGNESDEDQEELSAIVEIGHLVP*DSDDM*,ATGCATGCCTTAGAAATAGCAGCAATAGTAAGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTAGTCTATAGTATTAATAGAATATAAGAAAATTTTAAGACAAAAGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGACGAGGACCAGGAAGAATTATCAGCAATTGTAGAGATAGGGCATCTTGTTCCTTAGGATAGTGATGATATGTAG +MK115095.1,env,5628,8228,6223,8793,forward,0.7513561129398668,MTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD,MKVTRTRKNYQQL*R*GILFLRIVMICSANNL*VTVYYEVPVWKEATTTLFCASDAKAYKTEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISL*DQSLKPCVKLTPLCVTLNCTDELNLNCPNNNTCSNNTKYNMTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD*NDTLKQIVIKLKEKFKNKTIVFNQSSGKDPEIVMHSFNCREEFFYCNTTQLFNST*NNNT*NGTDN*NSTESNSTITLPCRIKQIINLWQEVRRAMYAPPIQGQIRCSSNITGLLLVRDSKSNNSSNDTKTFRPRRGDMKDN*RSELYKYKVVKIEPLRIAPTHAKRRVVQKEKRAIGLRAFFLKFLGAAGSTIGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTV*GIKQLQARVLALERYLKDQQLLKI*GCSRKLICTTNVP*NVS*SPR*NRSLDKI*TNMT*KQ*EKEIDNYTDTIYNLIEQSQNQQEQNEQDLLALDK*ASL*N*FDITQWL*YIKIFIMIVRGLISLRIVFTILSIVNRVRQRYSPLSLQTLLPTQRGPDRPERTEEGGREKDRGTSTRLVHRFLALI*DDLRSLFLFSYHRLRDLLLIVARIVELLRRRK*EALKYW*NLLQY*SQEIKNSAVSLLNTTAIAVAERTDKIIEVLQRGFRAILHIPTRIRQGLEKALL*,ATGAAAGTGACGAGGACCAGGAAGAATTATCAGCAATTGTAGAGATAGGGCATCTTGTTCCTTAGGATAGTGATGATATGTAGTGCCAACAACTTGTAGGTCACAGTCTATTATGAGGTACCTGTATGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAAGACAGAGAAGCATAATGTTTGGGCAACCCATGCCTGTGTACCCACAGACCCCAGCCCACAGGAAGTAGCATTAGAAAATGTGACAGAAACATTTAACATGTGGAAAAATGACATGGTAGAGCAGATGCATGAGGATATAATCAGTTTATAAGATCAAAGCCTAAAGCCATGTGTGAAACTAACCCCACTCTGTGTTACTTTAAATTGCACTGATGAATTAAATCTAAATTGCCCTAACAATAATACTTGTAGTAATAATACTAAATATAATATGACGGAAGAAGGAGAAATAAAAAACTGCTCTTTCAATGTCACCACAGGAATAAGAGATAAGGTGACAAAAGAACATGCACTTTTCTATAAACTTGATGTAGTACCAATAGATGAAAGTAGTGGAAATACTACAGGCAAATATAGGATGATAAATTGTAACACCTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTAGTTTTGCGATTCTAAAGTGTAAAGATAAGAAATTCAATAGAACAGGAGAATGTAGAAATGTCAGCACAGTACAATGTACACATAGAATTAGGCCAGTAGTATCAACTCAACTGCTGCTGAACGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGCCAATCTCTCGAACAATGCTAAAACCATAATAGTACAGCTGAATAAATCTGTAAAAATTAATTGTACAAGACCCAACAATAATACAAGAAGAAGTATACACATAGGACCAAGGAGGGCATTTTATAGAACAGACATAATAGGAGATATAAGACAAGCGCATTGTAACATTAGTAGGAAAGATTAGAATGACACTTTAAAACAGATAGTTATAAAATTAAAAGAAAAATTTAAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAAAGGACCCAGAGATAGTGATGCATAGTTTTAATTGTAGAGAAGAATTTTTCTACTGTAATACAACACAGCTGTTTAATAGTACTTAGAATAATAATACTTAGAATGGTACTGATAATTAGAATAGTACTGAATCAAATAGCACTATCACACTCCCATGCAGAATAAAACAAATTATAAACTTGTGGCAGGAAGTAAGAAGAGCAATGTATGCCCCTCCCATCCAAGGGCAAATTAGATGTTCATCAAATATTACAGGGCTGCTGCTAGTAAGAGATAGTAAGAGCAACAATAGTAGTAATGATACAAAGACCTTCAGGCCTAGAAGAGGAGATATGAAGGACAATTAGAGAAGTGAATTATATAAATATAAAGTAGTCAAAATTGAACCATTAAGAATAGCACCCACCCATGCAAAGAGAAGAGTGGTGCAGAAAGAAAAAAGAGCAATAGGACTTAGAGCTTTCTTCCTTAAGTTCTTAGGAGCAGCAGGAAGCACTATAGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTAAGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTTTAGAAAGATACCTAAAAGATCAACAGCTCCTGAAGATTTGAGGTTGCTCTAGAAAACTCATTTGCACCACTAATGTGCCCTAAAATGTTAGTTAGAGCCCTAGATAGAATAGATCTCTAGATAAGATTTAGACTAACATGACCTAGAAGCAGTAGGAAAAAGAAATTGACAATTATACAGACACAATATATAACTTAATTGAACAATCACAGAACCAACAAGAACAGAATGAACAAGACTTATTAGCATTAGATAAGTAGGCAAGTTTGTAGAATTAGTTTGACATTACACAGTGGCTATAGTATATAAAAATATTCATAATGATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGAGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAAAGGACAGATAAGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAAGCTTTGCTATAA +MK115095.1,nef,7624,8871,8795,9415,forward,0.5833488893037148,MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC,MNKTY*H*ISRQVCRISLTLHSGYSI*KYS****EA**V*E*FLLYCL**IELGRDTHHCHCRPSSQPRGDPTGPKEQKKEVERKTEAHPRD*CIDS*HSSRTTCGACSSSVTTA*ETYS*LWRGL*NF*DAESKKH*SIGRISCSIRVRK*RIVQLACSTPQQ*Q*LKGQIRL*KYYKEALELFSTYLHE*DRA*KKLCYKIGNKLSRRLRARWPAIKERMRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC*,ATGAACAAGACTTATTAGCATTAGATAAGTAGGCAAGTTTGTAGAATTAGTTTGACATTACACAGTGGCTATAGTATATAAAAATATTCATAATGATAGTAAGAGGCTTGATAAGTTTAAGAATAGTTTTTACTATACTGTCTATAGTGAATAGAGTTAGGCAGAGATACTCACCATTGTCATTGCAGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAGTGCAGTTAGCTTGCTCAACACCACAGCAATAGCAGTAGCTGAAAGGACAGATAAGATTATAGAAGTATTACAAAGAGGCTTTAGAGCTATTCTCCACATACCTACACGAATAAGACAGGGCTTAGAAAAAGCTTTGCTATAAGATAGGTAACAAGTTGTCAAGAAGGCTCAGGGCTAGATGGCCTGCCATAAAAGAAAGAATGAGACAAGCTAGGCCAGTAAGAAAGCCAGAGCCAGCAGCAACTAAGGTAAGAGCAGCATCTCGAGACCTAGAAAGACATGGAGCACTTACAAGTAGCAATACAGCAGCTACCAATGCTGATGTTGCCTGCCTAGAAGCACAACAGGAAGAAAAAGAGGTAGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGGCCAATGACTTACAAAGGAGCTCTAGATATTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAAAGAAGACAAGACATCCTTGATCTGTGGCTCTACAACACACAAGGCTACTTCCCTGACTGGCAGAACTACACACCAAGGCCAGGAGTCAGATTTCCACTGTGTTTTAGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGATAAGGTAGAAGAGGCCAGTGTAGGAGAGAACAACTGCTTGTTAAGCCCCGAAAACCTGCATAGAATAGAAGACGAACACAGAGAAGTATTGCAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTATTACAAGGACTGCTGA +MK115095.1,tat_exon2,7810,7902,8375,8470,forward,0.5303030303030303,RPSSQPRGDPTGPKEQKKEVERKTEAHPRD,RPSSQPRGDPTGPKEQKKEVERKTEAHPRD*,AGACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAG +MK115095.1,rev_exon2,7811,8086,8376,8651,forward,0.6667847862036381,ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE,DPPPNPEGTRQARKNRRRR*RERQRHIHEISA*ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE*,GACCCTCCTCCCAACCCAGAGGGGACCCGACAGGCCCGAAAGAACAGAAGAAGGAGGTAGAGAGAAAGACAGAGGCACATCCACGAGATTAGTGCATAGATTCTTAGCACTCATCTAGGACGACCTGCGGAGCCTGTTCCTCTTCAGTTACCACCGCTTGAGAGACTTACTCTTGATTGTGGCGAGGATTGTAGAACTTCTAAGACGCAGAAAGTAAGAAGCACTGAAGTATTGGTAGAATCTCCTGCAGTATTAGAGTCAGGAAATAAAGAATAG +MK115490.1,gag,549,2048,789,2291,forward,0.3014827756125966,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115490.1,pol,1841,4852,2084,5095,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115490.1,vif,4797,5375,5040,5618,forward,0.378905844492889,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115490.1,vpr,5315,5605,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115490.1,tat_exon1,5586,5801,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG +MK115490.1,rev_exon1,5725,5805,5968,6045,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115490.1,vpu,5817,6062,6060,6308,forward,0.5278361344537815,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115490.1,env,5980,8520,6223,8793,forward,0.46021436825118545,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115490.1,tat_exon2,8102,8197,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115490.1,rev_exon2,8103,8378,8376,8651,forward,0.40871934604904625,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115490.1,nef,8522,9136,8795,9415,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +MK115576.1,gag,468,1967,789,2291,forward,0.3014827756125966,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE,MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE*,ATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAA +MK115576.1,pol,1760,4771,2084,5095,forward,0.19610372855115465,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MK115576.1,vif,4716,5294,5040,5618,forward,0.36908151428872715,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH,MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH*,ATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +MK115576.1,vpr,5234,5524,5558,5848,forward,0.31767642387111417,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS,MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS*,ATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MK115576.1,tat_exon1,5505,5720,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG +MK115576.1,rev_exon1,5644,5724,5968,6045,forward,0.4807692307692307,MAGRSGDSDEELLKAVRLIKILYQSSK,MAGRSGDSDEELLKAVRLIKILYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +MK115576.1,vpu,5736,5981,6060,6308,forward,0.5399181166837258,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL,MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL*,ATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAG +MK115576.1,env,5899,8439,6223,8793,forward,0.4583799776107468,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL,MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAA +MK115576.1,tat_exon2,8021,8116,8375,8470,forward,0.32608695652173914,RPTSQPRGDPTGPKESKKKVEKETETDQFD,RPTSQPRGDPTGPKESKKKVEKETETDQFD**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGA +MK115576.1,rev_exon2,8022,8297,8376,8651,forward,0.38952607660679506,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE,DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAG +MK115576.1,nef,8441,9055,8795,9415,forward,0.4624277456647399,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC,MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGA +OQ092466,gag,825,2360,789,2291,forward,0.2559303794507086,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAACCCTAGCCTGTTAGAAACAGCAGAAGGCTGTAGACAAATATTGGGACAGTTACAACCGTCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACATTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGGTAAAAGACACCAAGGAAGCCTTAGAGAAGATAGAGGAAGAGCAAAACAAAAGCAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAGCAGCCAGGTTAGACACACAGGAAACAGCAGCCAGGTCAGCCAAAATTACCCTATAGTACAGAACCTTCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAATACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGACTACATCCAGTGCATGCAGGGCCCATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAGTAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTACACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGGGGACCCGGACATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCACGTAACAAATTCAAGTGCCATAATGATGCAGAGGGGCAATTTTAGAAACCAAAGAAAGGCTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCACCACCAGAAGAGATCTTCAGGTTTGTGGAAGAGACAACAACTCCCTCTCAGAAACAGGAGCCAATAGACAAGGAACTGTATCCTCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA +OQ092466,pol,2147,5164,2084,5095,forward,0.19193360134872262,FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAATTTTCTCCAGAGCAGACCAGAGCCAACAGCCCCACCACCAGAAGAGATCTTCAGGTTTGTGGAAGAGACAACAACTCCCTCTCAGAAACAGGAGCCAATAGACAAGGAACTGTATCCTCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAGCTAAAGGAAGCTCTATTAGATACAGGGGCAGATGATACAGTATTAGAAGACATGAATTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAGGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTATTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGCATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGTATGACAAAAATCTTAGAGCCTTATAGAACACGAAATCCAGAAATGGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGACTTAGAAATAGGGCAACATAGAGCAAAAATAGAGGAACTGAGACAACATCTGTTGAAGTGGGGATTTACTACCCCAGACAAAAAACATCAAAAAGAACCTCCATTCCTTTGGATGGGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAAACAAAGACAGCTGGACTGTCAATGACATACAGAAACTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACCCAGGGATTAAGGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTAGTACCGCTAACAGAAGAAGCAGAGTTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGGGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGGAAGGACAATGGACATTTCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGCGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACAGAAGGCATAGTAATATGGGGAAAAATTCCTAAATTTAGACTACCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAACACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAAACTAAAAAAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGATACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATACGCATTGGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTGATAAAAAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTGCTGGAATCAGGAAAGTATTATTTTTAGATGGAATAGAGAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAGTGTCAGCTAAAAGGAGAAGCCATACATGGACAGGTAGACTGTAGTCCAGGAATATGGCAATTAGATTGTACACATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTCATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATACGGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATCCAAACCAAAGAACTACAAAAACAAATTATAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTTATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +OQ092466,vif,5109,5687,5040,5618,forward,0.24677296886864086,MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGTATGTTTCAAGGAAAGCTAAGGGATGGTTTTATAGACATCACTTTGAAAGCAATCATCCAAAAATAAGTTCAGAAGTACACATCCCACTGGAGGATGCTAGACTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGGGTCTCCATAGAATGGAGGAAAAAGAGATATAGCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTACTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACACATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAATAACACCAAAAAAGAGAAAGCCACCCTTGCCTAGTGTTAAGAAGCTAACAGAAGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAG +OQ092466,vpr,5627,5917,5558,5848,forward,0.2608047690014903,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAGCTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTCCATAGCTTAGGGCAATATATCTATGAAACTTATGGAGATACTTGGGCAGGGGTGGAAGCCATAATAAGAATTCTGCAACAACTGTTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATTATTCGACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +OQ092466,tat_exon1,5898,6113,5829,6044,forward,0.40192926045016075,MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ,MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ,ATGGAGCCAGTAGATCCTAGGCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCACTTGTTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAG +OQ092466,rev_exon1,6037,6117,5968,6045,forward,0.4807692307692307,MAGRSGDSDDELLKTVRLIKVLYQSSK,MAGRSGDSDDELLKTVRLIKVLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAGTAAG +OQ092466,vpu,6129,6374,6060,6308,forward,0.5077548005908421,MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL,MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL*,ATGCAACCTTTAACAATATTAGCAATAGTAGCACTAGTAGTAGCAGCAATACTAGCAATAGTTGTGTGGTCCATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAAAGTGAGGGGGATCAGGAAGAATTATCAGCACTGGTGGAGAGGGGGCATCTTGCTCCTTGGAATGTTGATGATCTGTAA +OQ092466,env,6292,8874,6223,8793,forward,0.48559709145147756,MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL,MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL*,ATGAAAGTGAGGGGGATCAGGAAGAATTATCAGCACTGGTGGAGAGGGGGCATCTTGCTCCTTGGAATGTTGATGATCTGTAATGCTACAGAACAACAATTGTGGGTTACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAAACACCACTCTATTTTGTGCATCAGATGCTAAAGCATATAGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGGTATTAAAAAATGTGACAGAAAATTTTAATATGTGGGAAAATAACATGGTAGAACAGATGCATGAAGATATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAGTTAACTCCACTCTGTGTTACTCTAAATTGCACTAATACCACTAGGAGTAGTGGAAATACTACCAATGAAATGAAAAACTGCTCTTTCTATACCGAAACAGACATAAGAGATAAGAAGAGAAAGGAATATGCACTTTTTTATGAACTTGATATAGTACCCATAGATGAGGATAATAAGAATAAGAGTAATAATATTAGCTATTCTAGGTTAATAAGTTGCAACACCTCAGTTATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAATGATAAGAAATTCAATGGAACAGGGCCATGTACAAATGTCAGCACAGTGCAATGTACACATGGTATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGACGAGGTAGTAATTAAATCTAGCAATTTCACGAACAATGCTAAAACCATAATAGTACAGCTAAATGAAACTGTAAAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGACCAGGGAGAGCATTTTATGCAACAGGAGACATAATAGGAGACATAAGACAAGCACATTGTAACATCTCTAGAGCAAACTGGACAAACACTTTAAAACAGATAGCTGAAAAATTAGGAAAACAATTTGAGGAAAATAAAACAATAGTCTTTAATCCCTCCTCAGGAGGGGACCCAGAGGTTGTAATGCACAGTTTTAATTGTAGAGGGGAATTTTTCTACTGTAATTCAACACCACTGTTTAATAGTACTTGGAAGGAGACTAATGGGATTTGGACTCGTATTGGAGAGTCAAATGATAGTGCTACTATCACACTAAATGATAGTGATACTATCACACTCCAATGTAAAATAAGGCAAATTATAAACTTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAAAGGACAAATTAGCTGTTTATCAAACATTACAGGGCTGCTATTAGTAAGAGATGGTGGCAATAACACGAACGGGACCGAGATCTTCAGACCTGTAGGAGGAGAAATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAGAGAGAGAAAAGAGCGACATTGGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAGGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATCTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGTAATAAATCTCTGGAAAAAATTTGGAATAATATGACCTGGATGGAGTGGGAAAGAGAAATTGACAATTACACAAGCTTAATATACACCTTACTTGAAGAATCGCAGAACCAGCAAGAAAAAAATGAAAAAGAATTATTGGAATTAGATACATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATAATGATAATAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTACTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTCCAGATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGAACGGATTCTTAGCACTTTTCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCTCTCAAATACGGGTGGAGTCTCCTACAATATTGGAGCCAGGAACTAAAGAATAGTGCTGTCAGCTTGCTCAACGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAATATTACAAAGAGCTTGTAGAGCTATTCTCCATATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA +OQ092466,tat_exon2,8456,8551,8375,8470,forward,0.5303030303030303,RSTPQLRGDPTGPKESKEKVERETETDPVH,RSTPQLRGDPTGPKESKEKVERETETDPVH**,AGATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGA +OQ092466,rev_exon2,8457,8732,8376,8651,forward,0.3690449563855961,DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE,DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE*,GATCCACCCCCCAGCTCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGTCCATTAGTGAACGGATTCTTAGCACTTTTCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCTCTCAAATACGGGTGGAGTCTCCTACAATATTGGAGCCAGGAACTAAAGAATAG +OQ092466,nef,8876,9508,8795,9415,forward,0.411658382286489,MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC,MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC*,ATGGGTGGCAAATGGTCAAAAAGTAAGCTATTTGGATGGCCTGCTGTAAGGGAAAGAATGAGAAGAGCTGAGCCAGCAGCAGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAGACACGGAGCAATCACAAGTAGCAATACACCAACTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAAGAGGAGGAGGTGGGTTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCGGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCCAAAAAGACAAGAGATCCTTGATCTGTGGGTCTATCATACACAAGGTTTCTTCCCTGATTGGGATAACTACACACCAGGGCCAGGGATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGTTAGTACCAGTGGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAATAACTGCTTGTTACACCCTATGAGCCAGCATGGGATGGAGGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCGTCACGTGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGA +OQ092463,gag,801,2312,140,1642,forward,0.2589641434262949,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGATAGATGGGAAAGAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAGCGGTTCGCAGTTAATCCTGGCCTGTTAGAAACATCAAAAGGCTGTAGACAAATATTGGAACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATAGATGTAAAAGACACCAAGGAAGCTTTAGATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAACACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGACCAGCCAGGCCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGACTAAATAAAATAGTAAGGATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAATCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAACAATGTACACAGGAGGTAAAAAATTGGATGACAGAAACATTATTGGTCCAAAATGCAAACCCAGATTGCAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCTGGCCATAAAGCAAGAGTTTTGGCAGAAGCAATGAGCCAAGTAACAACTCCAGGTACCATAATGATGCAGAGAGGCAATTTCAGGAACCAGAGAAAGAATGTTAAGTGTTTCAACTGTGGCAAAGAAGGGCATATAGCTAAAAATTGCAGGGCCCCTAGAAAAAGGGGCTGTTGGAAATGTGGAAAAGAAGGACACCAAATGAAAGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGGTAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +OQ092463,pol,2105,5116,1435,4446,forward,0.14797358397500882,FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGGTAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGACATGACTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTTGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTAACTCAAATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATCTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAGTCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGATGAATTAAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGATATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGTTGCCAGAAAAGGACAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAGGCACTAACAGAAGTAGTACCACTAACAAGAGAAGCAGAGCTAGAGCTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAGTTACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAATGAGAGGTGCCCACACTAATGATGTAAAGCAACTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAGTTTAAACTACCCATACAAAGAGAAACATGGGACACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAATTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAGAAAGAACCTATAGTAGGAGCAGAAACTTTCTATGTAGATGGTGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGATACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTTAATCAAATAATAGAACAGTTAATAAAAAAGGACAAGGTATACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGATGACCATGAGAAATATCACAGTAATTGGAGGGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGCCAGTTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACACTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGGTATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAACAACAATACATACAGACAATGGCAGCAATTTCATCAGTACTACAGTTAAGGCCGCCTGCTGGTGGGCGGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATCATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATACATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAACTTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +OQ092463,vif,5061,5639,4391,4969,forward,0.32379004771642805,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGGACATGGAAAAGTTTAGTAAAACACCATATGTATATTTCAAGGAAAGCTAAGGGATGGGTTTATAAGCATCACTATGACAGTATTCATCCAAGAATAAGTTCAGAAGTTCACATCCCACTAGGGGATGCGAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCACTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAGGAGAGATATAGCACACAAGTAGACCCTGGCCTAGCAGACCAACTAATTCATCGGTATTACTTTGATTGTTTTTCAGAATCTGCCATAAGAAATGCCATATTAGGACGTATAGTTAGTCCTAGTTGTGATTATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG +OQ092463,vpr,5579,5869,4909,5199,forward,0.34013605442176864,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAITRILQQLLFIHFRIGCQHSRIGIIQRRRARNGTSRS,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAITRILQQLLFIHFRIGCQHSRIGIIQRRRARNGTSRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACACTTCCCTAGGCCATGGCTCCACAGCTTAGGGCAACATATCTATGAAACATATGGAGATACTTGGGCAGGAGTGGAAGCCATAACAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATCATTCAACGGAGGAGAGCAAGAAATGGAACCAGTAGATCCTAG +OQ092463,tat_exon1,5850,6068,5180,5398,forward,0.38728632478632474,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ*,ATGGAACCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA +OQ092463,rev_exon1,5989,6069,5319,5396,forward,0.3620426829268293,MAGRSGDSDEELIKTVRLIKLLYQSSK,MAGRSGDSDEELIKTVRLIKLLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAG +OQ092463,vpu,6081,6329,5411,5656,forward,0.44033465433729635,MQPLEISAIVALVVAIIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL,MQPLEISAIVALVVAIIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL*,ATGCAACCTTTAGAAATATCAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGGTCCATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGATAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAGGGGGATCAGGAAGAATTATCAGCACTTGTTGTGGAGATGGGGCACGATGCTCCTTGGGATGTTAATGATCTGTAG +OQ092463,env,6244,8826,5574,8123,forward,0.44564023273792597,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFYASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNTTSTKNTTPSTTASSGERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKKFNGSGPCTNVSTIQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKTIIVHLKDSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSSWKDESNGTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLITRDGGKNNESNTTEIFRPEGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKTLEQIWDNMTWMQWEREIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHPPAPRGPDRPEGIGEEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLNIPRRIRQGLERALL,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFYASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNTTSTKNTTPSTTASSGERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKKFNGSGPCTNVSTIQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKTIIVHLKDSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSSWKDESNGTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLITRDGGKNNESNTTEIFRPEGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKTLEQIWDNMTWMQWEREIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHPPAPRGPDRPEGIGEEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLNIPRRIRQGLERALL*,ATGAGAGCGAGGGGGATCAGGAAGAATTATCAGCACTTGTTGTGGAGATGGGGCACGATGCTCCTTGGGATGTTAATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACTACCACTCTATTTTATGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCTACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGGAAATGTGACAGAGAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTGAATTGCACTAATTATAATAACACCAATACCACTAGTACCAAGAATACCACCCCTAGTACCACTGCTAGTAGCGGGGAAAGGATGGGGGAAGGAGAAATAAAAAACTGCTCTTTCAATATCACCACAAGCCTAAGAGATAAGATGCAGAAAGAATATGCACTCTTTTATAGACCTGATATAGTACCAATAGATAATGATAATACTAGTTATAGGTTGATAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCAGCTGGTTTTGCGATTCTAAAGTGTAACAATAAGAAGTTCAATGGATCAGGACCATGTACAAATGTCAGCACAATACAATGTACACATGGAATTAGGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGAAAATTTCTCAGACAATGCTAAAACCATAATAGTACATCTGAAGGATTCTGTAGAAATTACTTGTATAAGACCCAACAACAATACAAGAAAAAGTATACCTATGGGACCAGGGAAAGCATTTTTTGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAAAATTAATAAAACGAAATGGAATAACACTTTAGACCAGATATTTAAAAAGTTAAGAGAACAATTTGGGAATAATAAGACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTGTAACGCACAATTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACATCAAAACTGTTTAATAGTACTTGGAATGAGACTAGTTCTTGGAAGGATGAGTCAAATGGCACTATCACACTCCCATGCAGAATAAAGCAAATTATAAACCTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGACTCATTAAATGTTCATCAAATATCACAGGGCTGCTAATAACAAGAGATGGTGGGAAAAATAATGAGAGCAACACCACCGAGATTTTCAGACCTGAAGGAGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAAACTCTGGAACAGATTTGGGATAACATGACCTGGATGCAATGGGAAAGAGAAATTGACAATTACACAAGCTTGATATACACTTTAATTGAAGAATCGCAAAACCAACAAGAAAAGAATGAACTAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTGCTTTCTATAGCGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCACCCCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCGGGGGGTGGGAACTCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTATTAGCTTGCTTAATGCTACAGCCATAGCAGTAGCTGAGGGGACAGACAGGATTATAGAAGTATTACAAAGAGCTGGGAGAGCTTTTCTCAACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA +OQ092463,tat_exon2,8408,8503,7705,7797,forward,0.4918032786885247,RPTPQPRGDPTGQKESEKKVERETETDPDH,RPTPQPRGDPTGQKESEKKVERETETDPDH**,AGACCCACCCCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGA +OQ092463,rev_exon2,8409,8684,7706,7981,forward,0.3471418653089562,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE*,GACCCACCCCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGGAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCGGGGGGTGGGAACTCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG +OQ092463,nef,8828,9460,8125,8751,forward,0.33768732280275404,MGGKWSKSSVVGWPAIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC,MGGKWSKSSVVGWPAIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC*,ATGGGTGGTAAGTGGTCAAAAAGTAGTGTGGTTGGATGGCCTGCTATAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTAGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCAGGCCTCAGGTACCTTTAAGACCAATGACTTATAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGTTAATTTACTCCCAGAAAAGACAAGATATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATAAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTGCCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGATGACCCAGAGAAAGAAGTGTTAGTATGGAGATTTGACAGTCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGGATTGCTGA +OQ092465,gag,855,2357,200,1699,forward,0.38383718162342295,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQQIDVKDTKEALDKIEEEQNKSKKKVQQAATDTGNNSQASQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGAIMMQRGNFRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEETTTPSQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQQIDVKDTKEALDKIEEEQNKSKKKVQQAATDTGNNSQASQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGAIMMQRGNFRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEETTTPSQKQEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGATAGGTGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAACTAGAACGGTTTGCAGTTAATCCTGGCCTGTTAGAAACATCAAAAGGCTGTAGACAAATATTGGAACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAACAGATAGATGTAAAAGACACCAAGGAAGCTTTAGATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGTACAGCAAGCAGCAACTGACACAGGAAACAACAGCCAGGCCAGCCAAAATTACCCTATAGTGCAGAATCTCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAATCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAACAATGTACACAGGAGGTAAAAAATTGGATGACAGAAACATTATTGGTCCAAAATGCAAACCCAGACTGCAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCTGGCCATAAAGCAAGAGTTTTGGCAGAAGCAATGAGCCAAGTAACAACTCCAGGTGCCATAATGATGCAGAGAGGCAATTTCAGGAGCCAAAGAAAGACTGTTAAGTGTTTCAACTGTGGCAAAGAAGGGCATATAGCTAAAAATTGCAGGGCCCCTAGAAAAAGGGGCTGTTGGAAATGTGGAAAAGAAGGACACCAAATGAAAGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTCGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +OQ092465,pol,2150,5161,1492,4503,forward,0.21863141758600757,FFREDLAFPQGEAREFSSEQTRANSPTSRELQVRGGDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCRLLKGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTSRELQVRGGDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCRLLKGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTCGGGGAGGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGACACAGGAGCAGATGATACAGTATTAGAAGACATGACTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTTGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTTTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATCTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGATGAATTAAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGGTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGTTGCCAGAAAAAGACAGTTGGACTGTTAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAGGTAAAGCAATTATGTAGACTCCTTAAGGGAACCAAGGCACTAACAGAAGTAGTACCACTAACAAGAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGCAGAGTTACAGAAGCAGGGACAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGAGGTGCCCACACTAATGATGTAAAACAGCTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAGTTTAAACTACCCATACAAAGAGAAACATGGGACACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTTTATGTAGATGGTGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAATAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACCACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATCCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTTAATCAAATAATAGAACAGTTAATAAAAAAGGACAAAGTATACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGATGATCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGCCAGTTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTGGATTGTACACACTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTATCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGTGGCAATTTCATCAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAATTTGGCATACCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATCATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATACATACACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAACTTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +OQ092465,vif,5106,5684,4448,5026,forward,0.3589413907639558,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWIYKHHYDSINPKISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADRLIHLYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALTALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWIYKHHYDSINPKISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADRLIHLYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALTALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGGACATGGAAAAGTTTAGTAAAACACCATATGTATATTTCAAAGAAAGCTAAGGGATGGATTTATAAGCATCACTATGACAGTATTAATCCAAAAATAAGTTCAGAAGTTCACATCCCACTAGGGGATGCAAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGGCCTAGCAGACCGACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACGTATAGTTAGTCCTAGTTGTGATTATCAAGCAGGACATAACAAGGTAGGGTCTCTACAGTACTTGGCACTAACAGCACTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG +OQ092465,vpr,5624,5914,4966,5256,forward,0.2400808693454637,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGILQRRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGILQRRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACACTTTCCTAGGCCATGGCTACACAGCTTAGGGCAACATATCTATGAAACATATGGAGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCAACATAGCAGAATAGGCATCCTTCAACGGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +OQ092465,tat_exon1,5895,6113,5237,5455,forward,0.2515090543259557,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ*,ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA +OQ092465,rev_exon1,6034,6114,5376,5453,forward,0.4807692307692307,MAGRSGDSDEELIKTVRLIKLLYQSSK,MAGRSGDSDEELIKTVRLIKLLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAG +OQ092465,vpu,6126,6374,5468,5707,forward,0.3726554787759131,MQPLVISAIVALVVVAIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL,MQPLVISAIVALVVVAIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL*,ATGCAACCTTTAGTAATATCAGCAATAGTAGCATTAGTAGTAGTAGCGATAATAGCAATAGTTGTGTGGTCCATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGATAATTGATAGAATAAGGGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAGGGGGATCAGGAAGAATTATCAGCACTTGTTGTGGAGATGGGGCACGATGCTCCTTGGGATGTTAATGATCTGTAG +OQ092465,env,6289,8880,5631,8207,forward,0.48107374453325313,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTGANNTTSTNTTTPSTTVSSEERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNTSYRLISCNTSVITQACPKVTFEPIPIHYCAPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKNIIVHLNKSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLEQVFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSYWKGEGSNNDTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLLTRDGGNESETTDTETFRPVGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKNLTQIWDNMTWMQWEKEIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL,MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTGANNTTSTNTTTPSTTVSSEERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNTSYRLISCNTSVITQACPKVTFEPIPIHYCAPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKNIIVHLNKSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLEQVFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSYWKGEGSNNDTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLLTRDGGNESETTDTETFRPVGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKNLTQIWDNMTWMQWEKEIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL*,ATGAGAGCGAGGGGGATCAGGAAGAATTATCAGCACTTGTTGTGGAGATGGGGCACGATGCTCCTTGGGATGTTAATGATCTGTAGCGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTGTGGGCTACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGGAAATGTGACAGAGAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGTCTAAAACCATGTGTAAAATTAACCCCACTCTGTGTTACTTTGAATTGCACTAATTATAATAACACTGGTGCCAATAATACCACTAGTACCAATACTACCACCCCTAGTACCACTGTTAGTAGCGAGGAAAGGATGGGGGAAGGAGAAATAAAAAACTGCTCTTTCAATATCACCACAAGCCTAAGAGATAAGATGCAGAAAGAATATGCACTCTTTTATAGACCTGATATAGTACCAATAGATAATACTAGTTATAGGTTGATAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAGCCAATTCCCATACATTATTGTGCCCCAGCTGGTTTTGCGATTCTAAAGTGTAACAATAAGACGTTCAATGGATCAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTCTAGCAGAAGAAGAGATAGTAATTAGATCTGAAAATTTCTCAGACAATGCTAAAAACATAATAGTACATCTGAATAAATCTGTAGAAATTACTTGTATAAGACCCAACAACAATACAAGAAAAAGTATACCTATGGGACCAGGGAAAGCATTTTTTGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAAAATTAATAAAACGAAATGGAATAACACTTTAGAGCAGGTATTTAAAAAGTTAAGAGAACAATTTGGGAATAATAAGACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTGTAACGCACAATTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACATCAAAACTGTTTAATAGTACTTGGAATGAGACTAGTTATTGGAAGGGTGAAGGGTCAAACAATGACACTATCACACTCCCATGCAGAATAAAGCAAATTATAAACCTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACTCATTAAATGTTCATCAAATATCACAGGGCTACTATTAACAAGAGATGGTGGTAACGAGAGCGAGACCACCGACACTGAGACCTTCAGACCTGTAGGAGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGATTAGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAAAATCTGACACAGATTTGGGATAACATGACCTGGATGCAATGGGAAAAAGAAATTGACAATTACACAAGCTTAATATACACCTTAATTGAAGAATCGCAAAACCAACAAGAAAAGAATGAACTAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTGCTTTCTATAGCGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCGGGGGGTGGGAACTCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTATTAGCTTGCTTAATGCTACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGCAGGGAGAGCTTTTCTCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGGCTTTGCTATAA +OQ092465,tat_exon2,8462,8557,7789,7884,forward,0.5337214944201844,RPTSQPRGDPTGQKESKEKVERETETDPDH,RPTSQPRGDPTGQKESKEKVERETETDPDH**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGA +OQ092465,rev_exon2,8463,8738,7790,8065,forward,0.41220115416323155,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGGAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAGCAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCGGGGGGTGGGAACTCCTCAAGTATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG +OQ092465,nef,8882,9514,8209,8841,forward,0.3463855421686747,MGGKWSKSSVVGWPKIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC,MGGKWSKSSVVGWPKIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGGTTGGATGGCCTAAAATAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGAACCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCAGGCCTCAGGTACCTTTAAGACCAATGACTTATAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAGAAAAGACAAGATATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGATGACCCAGAGAAAGAAGTGTTAGTATGGAGATTTGACAGTCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGA +OQ092462,gag,767,2269,789,2291,forward,0.316486214000789,MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAGCTAAAACATATAGTATGGGCAAGCAGGGAACTAGAGCGATTTGCAGTTAATCCCGGCCTGTTAGAAACATCGGAGGGCTGTAGACAAATACTAGGGCAACTACAGCCCGCTCTTCAGACAGGATCAGAAGAACTTAAATCACTATTTCATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTGAAAGACACCAAAGAAGCTTTAGAGAAGATAGAGGAAGAGCAAAAGAAAAGTAAGAAAAAGGCACAGCAAGCAGCCGCTGACACAGGAAATAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATGCAGGGACAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGATAAGGCTTTCAGTCCAGAAGTAATACCCATGTTTACAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAATACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTACATCCAGTGCAGGCAGGGCCTGTTGCGCCAGGCCAGCTACGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTAACCTTCAGGAGCAAATAGCATGGATGACACATAATCCACCTGTCCCAGTAGGAGAAATCTATAAAAGATGGATACTTCTGGGATTAAATAAAATAGTAAGAATGTACAGCCCCGTCAGCATTCTGGACATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCTGAGCAGGCTTCACAGGATGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTAGGACCAGCAGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTAGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAGCAAATCCAGCTAGCATAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGCCTATTAAGTGTTTCAACTGTGGCAAAGAGGGGCATATTGCTAAAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGGTCTGGCCTTCCCGCAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACGACAACTCCCTCTCAGAAACCGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +OQ092462,pol,2062,5073,2084,5095,forward,0.1943357603710517,FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGGTCTGGCCTTCCCGCAAGGGGAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACGACAACTCCCTCTCAGAAACCGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGAGGGCAACTAAAGGAAGCTCTATTAGACACAGGAGCAGATGATACAGTTTTAGAAGAAATGAATTTGCCAGGAAAATGGAAGCCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGCTGCACTTTAAATTTTCCCATTAGCCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAGAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATCTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAATATTTGCCATAAAGAAGAAAGATGGTAATAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCTGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAGGACTTCAGGAAGTATACTGCATTTACAATACCTAGCACAAACAATGAGACACCAGGGATTAGATACCAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTGGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATTTATCAATACATGGATGATTTATATGTAGGGTCTGACTTAGAAATAGGGCAGCATAGAGCAAAAATAGAGGAACTGAGACAACATCTATTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCCGATAAATGGACAGTACAGCCTATATTGCTGCCAGAAAAAGACAGCTGGACTGTTAATGACATACAGAAGTTAGTGGGAAAATTGAACTGGGCAAGTCAGATTTACCCAGGAATCAAAGTAAGGCAGCTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAGTGGTACCACTAACAGCAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGATTTAATAGCAGAACTACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATATAAAAATCTGAAAACAGGAAAGTATGCAAGAATGAGAGGTACCCACACTAATGATATAAAACAATTAACAGAGGCAGTGCAAAAAATAGCTACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAATTACCCATACAAAAGGAAACATGGGAAGCATGGTGGATAGAGTATTGGCAAGCCACCTGGATTCCTGAATGGGAGTTTGTCAATACCCCTCCCTTAGTGAAACTATGGTACCAGTTGGAAAAAGAACCCATAGTGGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGGGAAACTAAATTAGGAAAAGCAGGATATGTTACTGACAAAGGAAGACAAAAAGTTGTCCCCCTAACGGACACAACAAATCAGAAGACTGAGCTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAACTAGTCAGTCAAATAATAGAGCAGTTAATAAAGAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAGTTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACCTGCCACCTATAGTAGCAAAGGAAATAGTAGCCAGTTGTGACAAATGTCAGTTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCTGGAATATGGCAGCTAGATTGTACACATCTAAAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTCTCTTGAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCTGCCTGTTGGTGGGCGGGGATCAAACAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGAAGTAATAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCAGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCGTCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACCAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATTATCAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +OQ092462,vif,5018,5596,5040,5618,forward,0.3566796368352788,MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAGAGTTTAGTAAAACATCATATGCATATATCAAGGAAAGCTAAGAATTGGTTGTATAGACATCACTATGAAAGCATTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTAGTAATAACAACATATTGGGGTCTGCTTACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGGAAAGGAGATATAGAACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTATTTTGATTGTTTTTCAGAGTCTGCTATAAGAAATGCCTTATTAGGACGTGTAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACCAGGTAGGATCTCTACAGTACTTGGCACTAACAGCATTAATAACACCAAAAAGGAGAAAGCCACCTTTGCCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGGCACTAG +OQ092462,vpr,5536,5826,5558,5848,forward,0.2608047690014903,MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS,MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAAAGGGAGCCATACAATGAATGGGCACTAGAACTTTTAGAGGAACTTAAAAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTTCATGGATTGGGACAGCATATCTATGAAACATATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGATGTCGACATAGCAGAATAGGCATTAATCTACAGAGGAGAGCAAGGAATGGATCCAGTAGATCCTAG +OQ092462,tat_exon1,5807,6025,5829,6044,forward,0.37688442211055273,MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ,MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ*,ATGGATCCAGTAGATCCTAGCCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTACCAATTGTTATTGTAAAAAGTGCTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGTAA +OQ092462,rev_exon1,5946,6023,5968,6045,forward,0.4267425320056898,MAGRSGDSDEELLKAVRLIKFLYQSS,MAGRSGDSDEELLKAVRLIKFLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGT +OQ092462,vpu,6038,6283,6060,6308,forward,0.5464940306036659,MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL,MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL*,ATGCGACCTTTAGAAATAGCAGCAATAGTAGCACTAGTAGTAGCAGTACTAATAGCAATAGTTGTGTGGTCTATAGTACTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGACAGGATAGTGGATAGAATAAGAGAAAGAGCAGAAGATAGTGGAAATGAGAGTGAAGGGGATCAGGAGGAATTATCAGCACTGGTGGAGAGGGGGCACCTTGCTCCTTGGGATATTGATGATCTGTAG +OQ092462,env,6201,8777,6223,8793,forward,0.5083167934238491,MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL,MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL*,ATGAGAGTGAAGGGGATCAGGAGGAATTATCAGCACTGGTGGAGAGGGGGCACCTTGCTCCTTGGGATATTGATGATCTGTAGTGCCACAGAGAACTTGTGGGTCACAGTCTACTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTTTATTTTGTGCATCAGATGCCAAAGCATATGATACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAGCCCACAAGAAGTAGTATTGAAAAATGTGACAGAAAAGTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATCAGGATATAATCAGTTTATGGGATGAAAGCCTAAAACCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATGCTACTATCAGTGGTAATGCAACAGAAGAAATAAAAAACTGCTCTTTCAATGTCAATACAAAAATAGGAGGTAAGAAGCAGAAAGAACGTGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAGTACTAATAGGACTAATACCAGCTATAGGTTGATAAGTTGTAACACTTCAGTCATTACACAAGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTGGAGATAAAGAGTTCAATGGAACAGGACTATGTAGAAATGTCAGCACAGTCCAATGTACACATGGAATCAGGCCAGTAGTATCAACTCAATTGCTGTTGAATGGCAGTCTAGCAGAAGGAGAGGTAGTAATTAAATCTGAAAATATCACGAACAATGTTAAAACCATAATAGTACAGCTAAATGAAACTGTATCAATTAATTGTACAAGACCTAGCAACAATACAAGAAGAAGCATACATATGGGACCAGGGAGAGCCTTTTATGCAACAGGAGAAATAATAGGAGATATAAGGAAAGCACAGTGTATCCTGAATAAGACAGACTGGAGTGACACTTTAACAAGGATAGCTAAAAAATTACACAAGCAATTTCATGGACCAATAGCATTTGAGCAATCCTCAGGAGGGGACCCTGAAATTACAATGCACACTTTTAATTGTGGAGGGGAATTTTTCTACTGCAACACATCAGCGTTGTTTAGCGGGACCTGGAATGGTACTGCTTGGACTAATGCTACTTGGGGTAATATTGCAGGTAACAATATCACACTCCAATGCAGAATAAAACAATTTATAAACAGATGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGAGAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGCAGTAACACAACAAATGGTGGCGAGAATGGGACCCAGATTGGCGAGAATGTGACCCAGATCTTCAGACCTGGAGGAGGGGATATGAGGGACAATTGGAGAAGTGAATTATACAAATATAAAGTAGTAAAAATTGAGCCATTAGGAATAGCACCCACCAAGGCAAAAAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTAACATTCGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACACTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTTCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAGGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATGCTAGTTGGAGTAATAAAACTCTGGAAAAAATTTGGGGGAACATGACCTGGATGGAGTGGGAGAGAGAAATTGACAATTATACAGACTTAATATACACCTTAATTGAACAATCGCAGAACCAACAAGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAGGCTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGTTTAGTAGGTTTAAGAATAGTTTTTGCTGTGCTTTCTATAGTAAATAGAGTTAGGCAGGGATACTCACCATTATCATTCCAGACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGAACGGATTCTTAGCACTCATCTGGATCGACCTGCGGAGTCTGTTCCTCTTCAGCTACCTCCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTGTTAGTTTGCTTAATGCTATAGCTATATCAGTAGCGGAGGGAACAGATAGGATTATAGAAGCAATACAAAGAATTTGTAGAGCTATCTTACACATACCTACAAGGATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +OQ092462,tat_exon2,8359,8454,8375,8470,forward,0.4034761018001243,RPASQPRGDPTGPKEPTKKVERETETDPDH,RPASQPRGDPTGPKEPTKKVERETETDPDH**,AGACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGA +OQ092462,rev_exon2,8360,8635,8376,8651,forward,0.38952607660679506,DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE,DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE*,GACCCGCCTCCCAGCCTCGAGGGGACCCGACAGGCCCGAAGGAACCGACGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGATCATTAGTGAACGGATTCTTAGCACTCATCTGGATCGACCTGCGGAGTCTGTTCCTCTTCAGCTACCTCCGCTTGAGAGACTTACTCTTGATTGCAGCGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG +OQ092462,nef,8779,9405,8795,9415,forward,0.5049429657794677,MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC,MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC*,ATGGGTGGCAAGGGGTCAAAAATGAGGGGATGGGTTGCTGTAAGGGAAAAAATGAGGCGAACTAAGCCAGAAGATGAGCCAGCAGCAAATGGGGTGGGGGCAGCATCTCGAGACTTGGAGAAATATGGCGCACTCACAAGTAGCAATACAGTAGCTACTAATGCTGATTTAGCTTGGCTAGAAGCACAAGAGGAAGAGGAGGTGGGCTTTCCAGTCAGACCTCAAGTACCTTTAAGACCAATGACTTACAAGGGAGCTCTAGATCTCAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGGCAAGATATCCTTGATCTGTGGGTTCACCACACACAAGGCTATCTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCCCTGACTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATCAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATAGAGGACCCGGAGAAAGAAGTCTTAATGTGGAAGTTTGACAGCCACCTAGCATTCCGTCACATGGCCCGAGAGCTGCATCCGGAGTATTACAAAGACTGCTGA +OQ092464,gag,773,2275,200,1699,forward,0.3910844507174782,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ,MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCGGTATTAAGCGGGGGAGAATTAGATAGATGGGAAAGAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGGTTCGCAGTTAATCCTGGCCTGTTAGAAACATCAAAAGGCTGTAGACAAATATTGGAACAGCTACAGCCAGCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATCGATGTAAAAGACACCAAGGAAGCTTTAGATAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGCCAGCCAAAATTACCCTATAGTGCAGAACATTCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCGCTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAACAATGTACACAGGAGGTAAAAAATTGGATGACAGAAACATTATTGGTCCAAAATGCAAACCCAGATTGCAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCTGGCCATAAAGCAAGAGTTTTGGCAGAAGCAATGAGCCAAGTAACAACTCCAGGTACCATAATGATGCAGAGAGGCAATTTAAGGAGCCAAAGAAAGACTGTTAAGTGTTTCAACTGTGGCAAAGAAGGGCATATAGCTAAAAATTGCAGGGCTCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAAGAAGGACACCAAATGAAAGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAAGAAATGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +OQ092464,pol,2068,5079,1492,4503,forward,0.21863141758600757,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAAGAAATGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGACATGACTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTAACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATCTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATATAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTAAGACAACATCTGTTGAAGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGATATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAGGACAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAAGCAATTATGTAAACTCCTTAGGGGAACCAAGGCACTAACAGAAGTAATACCACTAACAAGAGAAGCAGAGCTAGAACTGGCAGAGAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCAACAAAAGACTTAATAGTAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGAGGTGCCCACACTAATGATGTAAAACAACTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAGTTTAGACTACCCATACAAAGAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAGACTTTCTATGTAGATGGTGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTTAATCAAATAATAGAACAGTTAATAAAAAAGGACAAGGTATACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGACGATCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGACTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGCCAGTTAAAAGGGGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACACTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCGGCAATTTCATCAGTACTACAGTTAAGGCCGCCTGCTGGTGGGCGGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATACATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAGAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAACTTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGACCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +OQ092464,vif,5024,5602,4448,5026,forward,0.3264662839130924,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGGACATGGAAAAGTTTAGTAAAACACCATATGTATATTTCAAGGAAAGCTAAGGGATGGGTTTATAAGCATCACTATGACAGTACTCATCCAAGAATAAGTTCAGAAGTTCACATCCCGCTAGGGGATGCGAAATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAGAAGAGATATAGCACACAAGTAGACCCTGGCTTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGCTGTGATTATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAG +OQ092464,vpr,5542,5832,4966,5256,forward,0.2678354029705382,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGIIQRRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGIIQRRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACACTTTCCTAGGCCATGGCTCCACAGCTTAGGGCAACATATCTATGAAACATATGGAGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCATCATTCAACGGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +OQ092464,tat_exon1,5813,6031,5237,5455,forward,0.2515090543259557,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAPPDSQTHQASLSKQ,MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAPPDSQTHQASLSKQ*,ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCCAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA +OQ092464,rev_exon1,5952,6029,5376,5453,forward,0.4267425320056898,MAGRSGDSDEELLQTVRLIKLLYQSS,MAGRSGDSDEELLQTVRLIKLLYQSS,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCCAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGT +OQ092464,vpu,6044,6289,5468,5707,forward,0.4384802297327147,MQPLHIAAIVALVVAIIIAIVVWSIVFIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVEMGHCAPWDVNDL,MQPLHIAAIVALVVAIIIAIVVWSIVFIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVEMGHCAPWDVNDL*,ATGCAACCTTTACACATAGCAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGATAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAGGGGGATCAAGAAGAATTATCAGCACTTGTGGAGATGGGGCATTGTGCTCCTTGGGATGTTAATGATCTGTAG +OQ092464,env,6207,8789,5631,8207,forward,0.4684887834843129,MRVRGIKKNYQHLWRWGIVLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNNTTSTNDTTSTTTSSGEKMKEGEIKNCSFNITTSIRDKVQKEYALFYKPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGSCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSENFSDNAKTIIVHLNESVEITCIRPNNNTRKSIPIGPGRAFYATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNKTIIFTHSSGGDPEVVTHNFNCGGEFFYCNTTKLFNSTWNETSYWKDERSNDNDTITLPCRIKQIINLWQEVGKAMYAPPIRGYIKCSSNITGLLITRDGGKNESNTTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWDNMTWMEWEREIDNYTSLIYTLIEKSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSGPLVNGFLTIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL,MRVRGIKKNYQHLWRWGIVLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNNTTSTNDTTSTTTSSGEKMKEGEIKNCSFNITTSIRDKVQKEYALFYKPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGSCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSENFSDNAKTIIVHLNESVEITCIRPNNNTRKSIPIGPGRAFYATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNKTIIFTHSSGGDPEVVTHNFNCGGEFFYCNTTKLFNSTWNETSYWKDERSNDNDTITLPCRIKQIINLWQEVGKAMYAPPIRGYIKCSSNITGLLITRDGGKNESNTTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWDNMTWMEWEREIDNYTSLIYTLIEKSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSGPLVNGFLTIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL*,ATGAGAGTGAGGGGGATCAAGAAGAATTATCAGCACTTGTGGAGATGGGGCATTGTGCTCCTTGGGATGTTAATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACTACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATACAGAGGTACATAATGTTTGGGCTACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGGAAATGTGACAGAGAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGTCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTGAATTGCACTAATTATAATAACACCAATAATACCACTAGTACCAATGATACCACTAGTACCACTACTAGTAGCGGGGAAAAGATGAAGGAAGGAGAGATAAAAAACTGCTCTTTCAATATCACCACAAGCATAAGAGATAAGGTGCAGAAAGAATATGCACTCTTTTATAAACCTGATATAGTACCAATAGATAATGATAATACTAGTTATAGGTTGATAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCAGCTGGTTTTGCGATTCTAAAGTGTAACGATAAGAAGTTCAATGGAACAGGATCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCTCAGACAATGCTAAAACCATAATAGTACATCTGAATGAATCTGTAGAAATTACTTGTATAAGACCCAACAACAATACAAGAAAAAGTATACCTATAGGACCAGGGAGAGCATTTTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAAAATTAATAAAACGAAATGGAATAACACTTTAGACCAGATATTTAAAAAGTTAAGAGAACAATTTGGGAATAAGACAATAATCTTTACTCACTCCTCAGGAGGGGACCCAGAAGTTGTAACGCACAATTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGAGACTAGTTATTGGAAGGATGAAAGGTCAAATGACAATGACACTATCACACTCCCATGCAGAATAAAGCAAATTATAAACCTGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGATACATTAAATGTTCATCAAATATCACAGGGCTGCTAATAACAAGAGATGGTGGGAAAAACGAGAGCAACACCACCGAGACCTTCAGACCTGGAGGAGGAAATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAATAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATAACGCTGACGGTACAGGCCAGACTATTATTGTCTGGTATAGTGCAACAGCAAAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGGATAACATGACCTGGATGGAATGGGAAAGAGAAATTGACAATTACACAAGCTTAATATACACTTTAATTGAAAAATCGCAAAACCAACAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTGACATAACAAAGTGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGCGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAACTCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAGTGCTATTAGCTTGCTTAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGCTGGGAGAGCTTTTCTCCACATACCTAGAAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +OQ092464,tat_exon2,8371,8466,7789,7884,forward,0.4971219256933542,RPTSQPRGDPTGQKESKKKVERETETDPDH,RPTSQPRGDPTGQKESKKKVERETETDPDH**,AGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGA +OQ092464,rev_exon2,8372,8647,7790,8065,forward,0.3934495959166312,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILNNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGTPQILVESPAVLESGTKE,DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILNNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGTPQILVESPAVLESGTKE*,GACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCAGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGACCATTAGTGAACGGATTCTTAACAATTATCTGGGTCGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAACTCCTCAAATATTGGTGGAATCTCCTGCAGTATTGGAGTCAGGAACTAAAGAATAG +OQ092464,nef,8791,9411,8209,8841,forward,0.36363636363636354,MGGKWSKSSVVGWPAIRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEDEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIHSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC,MGGKWSKSSVVGWPAIRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEDEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIHSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC*,ATGGGTGGTAAGTGGTCAAAGAGTAGTGTGGTTGGATGGCCTGCTATAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGTGCCTGGCTAGAAGCACAAGAGGATGAGGAGGTGGGTTTTCCAGTCAGGCCTCAGGTACCTTTAAGACCAATGACTTACAAGGGAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGGTATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATGAAGGAGAGAACAACAGCTTGTTACACCCTATGAGCCTGCATGGGATGGATGACCCAGAGAAAGAAGTGTTAGTATGGAGGTTTGACAGTCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGGACTGCTGA +OQ092467,gag,808,2307,789,2291,forward,0.2880084183556755,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ,MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATAAATGGGAAAAAATTCGGTTAAGGCCAGGAGGAAAAAAACAATACAAATTAAAACATCTAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTTCTAGAGACATCAGAAGGGTGTAGACAAATACTGGGACAGCTACAACCAGCTCTTCAGACAGGATCAGAAGAATTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAAATAGAGGAAGAGCAAAACCAAAGTAAGAAAAAAGCAGCAGCTGCAGCAGCTGACACAGGAAACAGAAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCTTTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTACAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAATAGGTGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCAGGCAGGGCCTGTTGCACCAGGCCAAATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTAACCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGATATCTATAAAAGATGGATAATTCTGGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTGAGAGCCGAGCAAGCAACACAGGAAGTAAAGAATTGGATGACAGAAACTTTGCTGGTCCAAAATGCAAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCAGGCCACAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAACTGTAATGATGCAGAGAGGCAATTTTAGGAATCAAAGAAAGACAGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCATATAGCAAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAAAGAAGGGCACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAAACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGGGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAA +OQ092467,pol,2100,5111,2084,5095,forward,0.1880239208210378,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGGAGGCCAGGGAATTTTCTTCAGAGCAAACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGGGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAAATCACTCTTTGGCAACGACCCCTCGTCACAATAAAAATAGGGGGGCAGCTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGATATGAATTTACCAGGAAAATGGAAACCAAAAATGATAGGAGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCGTAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGCTGTACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGATAGTACTAAATGGAGAAAGTTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCGCATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGTGATGCCTATTTTTCAATTCCCTTAGATAAAGACTTCAGGAAGTACACTGCATTTACCATACCTAGTACAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAGGATATTAGAACCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTGGGATCTGACTTAGAAATAGGACAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTGAAGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAAAGCTGCCAGAAAAAGATAGCTGGACTGTCAATGACATCCAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTATGCAGGAATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACTAAAGCACTAACAGAAGTAGTACCACTAACAGCAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGAACCGGTACATGGAGTGTATTATGACCCAACGAAAGACCTAATAGCAGAACTACAGAAGCAGGGGCAAAGTCAATGGACATATCAAATTTATCAAGAACCATTTAAAAATCTGAAAACAGGAAAGTATGCAAGAATGAGGGGTGCCCACACTAATGATGTGAAACAATTAACAGAGGCAGTGCAAAAAATAGCCATAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAAATTACCTATACAAAAAGAAACATGGGAAACATGGTGGACAGACTATTGGCAAGCCACCTGGATTCCTGATTGGGAGTTTGTCAATACCCCTCCCTTAGTAAAATTATGGTACCAGTTAGAAAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAGATCAGGCAAAGCAGGATATGTTACTGATAGAGGAAGACAAAAGGTTGTCCCCCTAACAGACACAACAAACCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTGACAGACTCACAATATGCACTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAGTCAAATAATAGAGCAGTTAATAAAGAAGGAAAAGGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTTCTGGAATCAGGAAGATACTATTTTTAGATGGAATAACTAAGGCCCAAGATGATCATGAGAGATACCACAGCAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTATAATAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCACGCATGGACAAGTAGACTGCAGTCCAGGAATATGGCAACTAGATTGTACGCATTTAGAAGGAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTCTCTTAAAACTAGCAGGAAGATGGCCAGTAAAGACAGTACATACAGATAATGGCAGCAATTTCACCAGTGCTGCGGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAATTTGGTATTCCCTACAATCCCCAAAGTCAAGGAGTCATAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAAGTAAGAGAGCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAGAAACAAATCACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGACCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAGGCAAAGATCATTAGAGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +OQ092467,vif,5056,5634,5040,5618,forward,0.41532297468972923,MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH,MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATACATGTCTCAAAGAAAGCTAAGGGATGGGTTTATAGACACCACTATGAAAGCACCCATCCAAGAATAAGTTCAGAAGTACATATCCCGCTAGGGGAAGCTAGATTAGTAATAGCAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCACTTGGGTCAGGGAGTCTCCATAGAATGGAGGGAAAAGAAATATATCACACAAGTAGACCCTGACCTAGCAGACCAACTAATTCATCTGCATTATTTTGATTGTTTTTCAGAGTCTGCTATAAGAAATGCCATAGTAGGACGTTTAGTTAGCCCTCAGTGTGAATATCAAACAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCACTAGTAGCATTAATAACGCCAAAAAAGAGAAAGCCACCTTTGCCTAGTGTTAGGAAATTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGACCACAGAGGGAGCCATATAATGAGTGGACACTAG +OQ092467,vpr,5574,5864,5558,5848,forward,0.3120665742024965,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGACCACAGAGGGAGCCATATAATGAGTGGACACTAGAGCTTTTAGAGGAACTTAAGAGTGAAGCTGTTAGACATTTTCCTAGGATATGGCTCCATAACTTAGGACAATACATCTATGCAACTTATGGGGATACTTGGACAGGAGTGGAAGCTTTAATAAGAATTCTGCAACAACTGCTGTTTATTCATTTCAGAATTGGATGTCAACATAGCAGAATAGGCATTACTCGACAGAGGAGAGCAAGGAATGGAGCCAGTAGATCCTAG +OQ092467,tat_exon1,5845,6063,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ,MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTCTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAACAGTGAGACTCATCAAGCAGCTCTATCAAAGCAGTAA +OQ092467,rev_exon1,5984,6064,5968,6045,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKQLYQSSK,MAGRSGDSDEDLLKTVRLIKQLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAACAGTGAGACTCATCAAGCAGCTCTATCAAAGCAGTAAG +OQ092467,vpu,6076,6339,6060,6308,forward,0.4955621301775147,MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL,MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL*,ATGCAACCCTTAGTAATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAGAAAGATAGATAGCATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGATCAGGAAGAATTGTCGGCACTTGTGGAGATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAG +OQ092467,env,6239,8806,6223,8793,forward,0.4703403690377699,MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL,MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL*,ATGAGAGTGAAGGAGATCAGGAAGAATTGTCGGCACTTGTGGAGATGGGGCACCATGTGGAAATGGGGCACCATGCTCCTTGGAATGTTGATGATCTGTAGTGCTAAAGAACAATTGTGGGTCACAGTTTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTTTATTTTGTGCATCAAATGCTAAAGCATATGACCCAGAGGTGCATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACAAGAAGTACCATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGACATAATCAGTTTATGGGATCAAAGCTTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTATTTTAAATTGCACTAATGTGAATGTTACTACTAACAATAATAGTAGTAGTGAGGAACAGATGGAGGTAGGAGAAATAAAAAACTGCTCTTTCAATATTGCCACAAGAATAAAAAATAAGATAAAGAAAGAATATGCACTTTTTAATAGACTTGATGTAGTACCAATAGAGGATGATAATACAAGCTATATGTTGATAAATTGTAATACCTCAGTCACTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATACTAAAATGTAATGATAAAAAGTTCAATGGAACAGGACCATGTAACAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGATAGTAGTTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACAGCTGAATAAAACTATAGAAATTAATTGTATAAGACCCAACAATAATACAAGAAAAAGTATATCTTTAAGACCGGGGCAAGCAATTTATGCAACAGAAGACATAATAGGAAATATAAGACAAGCACATTGTAACATTAGGAGAAAAGACTGGGATAAAGCTTTAGAACAGGTAGTTGCAAAATTAAGAGAACAATTTAAGAATAAAACAATAGTCTTTAATCAATCCTCAGGAGGAGACCCAGAAATTGTAATGCATAGTTTTAATTGTGCAGGGGAATTTTTCTACTGTAACACAACAAAGCTGTTTAATAGTACTTGGAATGTTAATAACACTCGGAATAATACTACTGATAATAGCACCATCACTCTCCCGTGCAGAATAAAACAAATTATAAACAGATGGCAGGAAGTAGGAAAAGCAATGTATGCTCCTCCCATCAAAGGGCAAATTAAATGTTCATCAAATATTACAGGGTTATTATTAACAAGAGATGGTGGTGTCCGCGAGGACAACGCCCCTGAGATCTTTAGACCTGGAGGAGGAGATATGAGGGATAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTGGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAAAGAGGAAAAAGAGCAGTAACGCTGGGAGCTATGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGGCAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACTTACAGGATCAACAGCTCCTAGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTACCTTGGAATACTAGTTGGAGTAATAAATCTTTGGAAAAGATTTGGAAAAACATGACCTGGATGGAGTGGGAGAAAGAAATTAACAATTACACAAGGACAATATACACCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAGGAATTATTGGAATTGGATAAGTGGGCAAGTTTGTGGAATTGGTTTGACATAACAAACTGGCTGTGGTATATAAAAATATTCATCATGATAGTAGGAGGTATAGTAGGGTTAAGAATAGTTTTTACTGTGCTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTGTCATTCCAGACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGAACGGATTCTTTGCGCTTATCTGGGACGACCTGCAGAGCCTGTGCCTCTTCAGCTACCGCCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAAGAGTGCTGTTAGTTTGCTTAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAATTGGTAGAGCTATTCTCCACATCCCTAGAAGAATAAGACAGGGCTTAGAAAGGGCTTTGCTATAA +OQ092467,tat_exon2,8388,8483,8375,8470,forward,0.4918032786885247,RPASQLRGDQTGPKEQKKKVERETETDPGN,RPASQLRGDQTGPKEQKKKVERETETDPGN**,AGACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGA +OQ092467,rev_exon2,8389,8673,8376,8651,forward,0.4123815285339786,DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC,DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC*,GACCCGCTTCCCAGCTCCGAGGGGACCAGACAGGCCCGAAGGAACAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGGGCAATTAGTGAACGGATTCTTTGCGCTTATCTGGGACGACCTGCAGAGCCTGTGCCTCTTCAGCTACCGCCGCTTGAGAGACTTACTCTTGATTGTAGCGAGGATTGTGGAACTTCTGGGACACAGGGGGTGGGAGGCCCTCAAATATTGGTGGAATCTCCTGCAGTACTGGAGTCAGGAACTAAAGAAGAGTGCTGTTAG +OQ092467,nef,8808,9416,8795,9415,forward,0.484764542936288,MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC,MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC*,ATGGGTGGCAAGTGGTCAAAATGTAGTCTGGTTGGATGGCCTGCTATAAGGGAAAGAATGAGACGAGCTGAGCCAGCTCCAGCAGCAGAAGGGGTGGGAGCAGCATCTCGAGACTTGGAAAAACATGGAGCACTCACAACTAGTAATACAGCAGCTAATAATGCTGCTTGTGCCTGGCTGGAAGCACAAGAGGAGGAAGAGGTGGGGTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGGAGCTATGGATCTTGGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCCAAAAAGACAAGAAATCCTTGATCTGTGGGTCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTATACACCAGGGCCAGGGACTAGATATCCATTAACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCAGATGAAGGAGAGAATAGCTGTTTGCTACACCCGATGAACCAGCATGGGGCAGATGACACAGAAAGAGAAGTATTAATGTGGAAGTTTGACAGCAGCCTAGCATTTCATCACAAGGCCCGAGAGCTGCATCCGGAGTACTACAAAAACTGCTGA diff --git a/tests/expected-results-large-hxb2/errors.json b/tests/expected-results-large-hxb2/errors.json index ecef12f..82efca8 100644 --- a/tests/expected-results-large-hxb2/errors.json +++ b/tests/expected-results-large-hxb2/errors.json @@ -3,52 +3,52 @@ { "sequence_name": "KX505501.1", "error": "DeletionInOrf", - "message": "ORF pol at 2084-5096 can have maximum deletions 30, got 2721" + "message": "ORF pol at 2084-5095 can have maximum deletions 30, got 2721" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6322" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6322" }, { "sequence_name": "KX505501.1", "error": "InsertionInOrf", - "message": "Smaller ORF vif at 5040-5619 can have maximum insertions 90, got 909" + "message": "Smaller ORF vif at 5040-5618 can have maximum insertions 90, got 909" }, { "sequence_name": "KX505501.1", "error": "DeletionInOrf", - "message": "Smaller ORF vpr at 5558-5849 can have maximum deletions 30, got 66" + "message": "Smaller ORF vpr at 5558-5848 can have maximum deletions 30, got 66" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892" + "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5892" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6046 contains an internal stop codon at 6004" + "message": "Smaller ORF rev_exon1 at 5968-6045 contains an internal stop codon at 6004" }, { "sequence_name": "KX505501.1", "error": "FrameshiftInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains out of frame indels that impact 189 positions." + "message": "Smaller ORF vpu at 6060-6308 contains out of frame indels that impact 190 positions." }, { "sequence_name": "KX505501.1", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 51 positions." + "message": "Smaller ORF tat_exon2 at 8375-8470 contains out of frame indels that impact 51 positions." }, { "sequence_name": "KX505501.1", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 96" + "message": "Smaller ORF rev_exon2 at 8376-8651 can have maximum deletions 30, got 96" }, { "sequence_name": "KX505501.1", "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 867" + "message": "Smaller ORF nef at 8795-9415 can have maximum insertions 90, got 867" }, { "sequence_name": "KX505501.1", @@ -70,59 +70,59 @@ { "sequence_name": "MN691959", "error": "InternalStopInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6123" + "message": "Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6123" }, { "sequence_name": "MN691959", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" + "message": "Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420" } ], "MN692074": [ { "sequence_name": "MN692074", "error": "DeletionInOrf", - "message": "ORF pol at 2084-5096 can have maximum deletions 30, got 981" + "message": "ORF pol at 2084-5095 can have maximum deletions 30, got 981" }, { "sequence_name": "MN692074", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6550" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6550" }, { "sequence_name": "MN692074", "error": "DeletionInOrf", - "message": "Smaller ORF vif at 5040-5619 can have maximum deletions 30, got 81" + "message": "Smaller ORF vif at 5040-5618 can have maximum deletions 30, got 81" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF vpr at 5558-5849 can have maximum insertions 90, got 207" + "message": "Smaller ORF vpr at 5558-5848 can have maximum insertions 90, got 207" }, { "sequence_name": "MN692074", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892" + "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5892" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF vpu at 6060-6309 can have maximum insertions 90, got 249" + "message": "Smaller ORF vpu at 6060-6308 can have maximum insertions 90, got 249" }, { "sequence_name": "MN692074", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 40 positions." + "message": "Smaller ORF tat_exon2 at 8375-8470 contains out of frame indels that impact 40 positions." }, { "sequence_name": "MN692074", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 204" + "message": "Smaller ORF rev_exon2 at 8376-8651 can have maximum deletions 30, got 204" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 882" + "message": "Smaller ORF nef at 8795-9415 can have maximum insertions 90, got 882" }, { "sequence_name": "MN692074", @@ -140,12 +140,12 @@ { "sequence_name": "MN090335", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 822" + "message": "ORF gag at 789-2291 contains an internal stop codon at 822" }, { "sequence_name": "MN090335", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" + "message": "Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420" }, { "sequence_name": "MN090335", @@ -172,7 +172,7 @@ { "sequence_name": "MN090376", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 822" + "message": "ORF gag at 789-2291 contains an internal stop codon at 822" }, { "sequence_name": "MN090376", @@ -256,7 +256,7 @@ { "sequence_name": "MK115211.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6889" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6889" }, { "sequence_name": "MK115211.1", @@ -295,59 +295,59 @@ { "sequence_name": "MK114705.1", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8795-9416 can have maximum deletions 30, got 186" + "message": "Smaller ORF nef at 8795-9415 can have maximum deletions 30, got 186" } ], "MK114856.1": [ { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 873" + "message": "ORF gag at 789-2291 contains an internal stop codon at 873" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "ORF pol at 2084-5096 contains an internal stop codon at 2213" + "message": "ORF pol at 2084-5095 contains an internal stop codon at 2213" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6325" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6325" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vif at 5040-5619 contains an internal stop codon at 5172" + "message": "Smaller ORF vif at 5040-5618 contains an internal stop codon at 5172" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vpr at 5558-5849 contains an internal stop codon at 5594" + "message": "Smaller ORF vpr at 5558-5848 contains an internal stop codon at 5594" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5919" + "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5919" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126" + "message": "Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6126" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" + "message": "Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433" + "message": "Smaller ORF rev_exon2 at 8376-8651 contains an internal stop codon at 8433" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF nef at 8795-9416 contains an internal stop codon at 8852" + "message": "Smaller ORF nef at 8795-9415 contains an internal stop codon at 8852" }, { "sequence_name": "MK114856.1", @@ -359,42 +359,42 @@ { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 834" + "message": "ORF gag at 789-2291 contains an internal stop codon at 834" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "ORF pol at 2084-5096 contains an internal stop codon at 2183" + "message": "ORF pol at 2084-5095 contains an internal stop codon at 2183" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6349" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6349" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vif at 5040-5619 contains an internal stop codon at 5373" + "message": "Smaller ORF vif at 5040-5618 contains an internal stop codon at 5373" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vpr at 5558-5849 contains an internal stop codon at 5717" + "message": "Smaller ORF vpr at 5558-5848 contains an internal stop codon at 5717" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5859" + "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5859" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433" + "message": "Smaller ORF rev_exon2 at 8376-8651 contains an internal stop codon at 8433" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873" + "message": "Smaller ORF nef at 8795-9415 contains an internal stop codon at 8873" }, { "sequence_name": "MK115009.1", @@ -416,7 +416,7 @@ { "sequence_name": "MK115387.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" + "message": "Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420" } ], "MK115491.1": [], @@ -424,7 +424,7 @@ { "sequence_name": "MK116110.1", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 834" + "message": "ORF gag at 789-2291 contains an internal stop codon at 834" }, { "sequence_name": "MK116110.1", @@ -447,7 +447,7 @@ { "sequence_name": "MK114997.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6511" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6511" } ], "MK115518.1": [], @@ -477,47 +477,47 @@ { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 924" + "message": "ORF gag at 789-2291 contains an internal stop codon at 924" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "ORF pol at 2084-5096 contains an internal stop codon at 2183" + "message": "ORF pol at 2084-5095 contains an internal stop codon at 2183" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6424" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6424" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vif at 5040-5619 contains an internal stop codon at 5247" + "message": "Smaller ORF vif at 5040-5618 contains an internal stop codon at 5247" }, { "sequence_name": "MK115464.1", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains out of frame indels that impact 104 positions." + "message": "Smaller ORF tat_exon1 at 5829-6044 contains out of frame indels that impact 104 positions." }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126" + "message": "Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6126" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" + "message": "Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433" + "message": "Smaller ORF rev_exon2 at 8376-8651 contains an internal stop codon at 8433" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873" + "message": "Smaller ORF nef at 8795-9415 contains an internal stop codon at 8873" }, { "sequence_name": "MK115464.1", @@ -530,7 +530,7 @@ { "sequence_name": "MK115520.1", "error": "InternalStopInOrf", - "message": "ORF pol at 2084-5096 contains an internal stop codon at 2198" + "message": "ORF pol at 2084-5095 contains an internal stop codon at 2198" }, { "sequence_name": "MK115520.1", @@ -583,42 +583,42 @@ { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 927" + "message": "ORF gag at 789-2291 contains an internal stop codon at 927" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "ORF pol at 2084-5096 contains an internal stop codon at 2183" + "message": "ORF pol at 2084-5095 contains an internal stop codon at 2183" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6550" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6550" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vif at 5040-5619 contains an internal stop codon at 5151" + "message": "Smaller ORF vif at 5040-5618 contains an internal stop codon at 5151" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5859" + "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5859" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126" + "message": "Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6126" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433" + "message": "Smaller ORF rev_exon2 at 8376-8651 contains an internal stop codon at 8433" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873" + "message": "Smaller ORF nef at 8795-9415 contains an internal stop codon at 8873" }, { "sequence_name": "MK115095.1", diff --git a/tests/expected-results-large-hxb2/holistic.json b/tests/expected-results-large-hxb2/holistic.json index 2b57969..250dea5 100644 --- a/tests/expected-results-large-hxb2/holistic.json +++ b/tests/expected-results-large-hxb2/holistic.json @@ -6,9 +6,9 @@ "blast_matched_qlen": 1997, "blast_sseq_coverage": 0.2498456472525211, "blast_qseq_coverage": 1.2158237356034052, - "blast_sseq_orfs_coverage": 0.17663960024984385, + "blast_sseq_orfs_coverage": 0.17666166916541728, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 4 }, "MN691959": { @@ -20,7 +20,7 @@ "blast_qseq_coverage": 1.1086063415148004, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MN692074": { @@ -30,9 +30,9 @@ "blast_matched_qlen": 4178, "blast_sseq_coverage": 0.5042189750977567, "blast_qseq_coverage": 1.1728099569171853, - "blast_sseq_orfs_coverage": 0.4114928169893816, + "blast_sseq_orfs_coverage": 0.411544227886057, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 4 }, "MN692145": { @@ -44,7 +44,7 @@ "blast_qseq_coverage": 1.1271545051088863, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MN090335": { @@ -54,9 +54,9 @@ "blast_matched_qlen": 9069, "blast_sseq_coverage": 0.9842560197571517, "blast_qseq_coverage": 1.0603153600176425, - "blast_sseq_orfs_coverage": 1.0003747657713928, + "blast_sseq_orfs_coverage": 1.000374812593703, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MN090376": { @@ -66,9 +66,9 @@ "blast_matched_qlen": 8985, "blast_sseq_coverage": 0.9784935171846059, "blast_qseq_coverage": 1.0604340567612687, - "blast_sseq_orfs_coverage": 0.9943785134291068, + "blast_sseq_orfs_coverage": 0.9943778110944528, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115581.1": { @@ -80,7 +80,7 @@ "blast_qseq_coverage": 1.0046340179041602, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115690.1": { @@ -92,7 +92,7 @@ "blast_qseq_coverage": 1.0113530808132933, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115571.1": { @@ -104,7 +104,7 @@ "blast_qseq_coverage": 1.0113902490951672, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115514.1": { @@ -116,7 +116,7 @@ "blast_qseq_coverage": 1.0173736943082499, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115488.1": { @@ -128,7 +128,7 @@ "blast_qseq_coverage": 1.0325262392185388, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 6 }, "MK115030.1": { @@ -140,7 +140,7 @@ "blast_qseq_coverage": 1.0655270655270654, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115498.1": { @@ -152,7 +152,7 @@ "blast_qseq_coverage": 1.0080329774865235, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115211.1": { @@ -164,7 +164,7 @@ "blast_qseq_coverage": 1.0598981399468557, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115158.1": { @@ -176,7 +176,7 @@ "blast_qseq_coverage": 1.043749316416931, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK114705.1": { @@ -188,7 +188,7 @@ "blast_qseq_coverage": 1.122622463075125, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 6 }, "MK114856.1": { @@ -200,7 +200,7 @@ "blast_qseq_coverage": 1.0812493405085997, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 4 }, "MK115009.1": { @@ -212,7 +212,7 @@ "blast_qseq_coverage": 1.0590854784403172, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115387.1": { @@ -224,7 +224,7 @@ "blast_qseq_coverage": 1.040936952714536, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115491.1": { @@ -236,7 +236,7 @@ "blast_qseq_coverage": 1.0299299511780937, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK116110.1": { @@ -246,9 +246,9 @@ "blast_matched_qlen": 8967, "blast_sseq_coverage": 0.9846676270837621, "blast_qseq_coverage": 1.0635664101706257, - "blast_sseq_orfs_coverage": 0.9986258588382261, + "blast_sseq_orfs_coverage": 0.9986256871564217, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 4 }, "MK115527.1": { @@ -260,7 +260,7 @@ "blast_qseq_coverage": 1.0056956017297753, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK114997.1": { @@ -272,7 +272,7 @@ "blast_qseq_coverage": 1.0516841524019878, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115518.1": { @@ -284,7 +284,7 @@ "blast_qseq_coverage": 0.9996854356715948, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115065.1": { @@ -296,7 +296,7 @@ "blast_qseq_coverage": 1.069459518124593, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 6 }, "MK115464.1": { @@ -308,7 +308,7 @@ "blast_qseq_coverage": 0.9893407844354756, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115530.1": { @@ -320,7 +320,7 @@ "blast_qseq_coverage": 0.9992665549036044, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115520.1": { @@ -330,9 +330,9 @@ "blast_matched_qlen": 9589, "blast_sseq_coverage": 0.9786993208479111, "blast_qseq_coverage": 0.987902805297737, - "blast_sseq_orfs_coverage": 1.0121174266083697, + "blast_sseq_orfs_coverage": 1.012118940529735, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115503.1": { @@ -344,7 +344,7 @@ "blast_qseq_coverage": 0.9953207861079338, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115570.1": { @@ -356,7 +356,7 @@ "blast_qseq_coverage": 1.0057986294148655, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115509.1": { @@ -368,7 +368,7 @@ "blast_qseq_coverage": 1.0197797498128942, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115702.1": { @@ -378,9 +378,9 @@ "blast_matched_qlen": 9098, "blast_sseq_coverage": 0.9874459765383824, "blast_qseq_coverage": 1.0596834469114091, - "blast_sseq_orfs_coverage": 1.0198625858838226, + "blast_sseq_orfs_coverage": 1.0198650674662668, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 4 }, "MK115095.1": { @@ -392,7 +392,7 @@ "blast_qseq_coverage": 1.060085367188355, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115490.1": { @@ -404,7 +404,7 @@ "blast_qseq_coverage": 1.0204343639670483, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115576.1": { @@ -416,7 +416,7 @@ "blast_qseq_coverage": 1.0342110943233327, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "OQ092466": { @@ -428,7 +428,7 @@ "blast_qseq_coverage": 1.1192442700805285, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "OQ092463": { @@ -440,7 +440,7 @@ "blast_qseq_coverage": 1.1118167621030712, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "OQ092465": { @@ -452,7 +452,7 @@ "blast_qseq_coverage": 1.108292783932084, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "OQ092462": { @@ -464,7 +464,7 @@ "blast_qseq_coverage": 1.1301214741610048, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "OQ092464": { @@ -476,7 +476,7 @@ "blast_qseq_coverage": 1.115634156550858, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "OQ092467": { @@ -488,7 +488,7 @@ "blast_qseq_coverage": 1.0962157809983897, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 } } \ No newline at end of file diff --git a/tests/expected-results-large-hxb2/orfs.json b/tests/expected-results-large-hxb2/orfs.json index a7e0d52..205cc1d 100644 --- a/tests/expected-results-large-hxb2/orfs.json +++ b/tests/expected-results-large-hxb2/orfs.json @@ -3,9 +3,9 @@ { "name": "env", "start": 0, - "end": 1824, + "end": 1823, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.7623480451210163, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -15,9 +15,9 @@ { "name": "vif", "start": 0, - "end": 1824, + "end": 1823, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7647696476964769, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -27,9 +27,9 @@ { "name": "nef", "start": 0, - "end": 1824, + "end": 1823, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.764345579086969, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -39,9 +39,9 @@ { "name": "tat_exon1", "start": 1, - "end": 1750, + "end": 1749, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.7680130480667754, "protein": "MRKLQNGIDCIQCMQGLLHQAR", @@ -51,9 +51,9 @@ { "name": "gag", "start": 336, - "end": 1824, + "end": 1823, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3997973809613161, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -63,9 +63,9 @@ { "name": "rev_exon1", "start": 1306, - "end": 1750, + "end": 1749, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.758082497212932, "protein": "MRTQIVKLF", @@ -75,9 +75,9 @@ { "name": "vpr", "start": 1599, - "end": 1824, + "end": 1823, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.763687959047407, "protein": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -87,9 +87,9 @@ { "name": "vpu", "start": 1599, - "end": 1824, + "end": 1823, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7672672672672673, "protein": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -99,9 +99,9 @@ { "name": "pol", "start": 1627, - "end": 1927, + "end": 1926, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.7724330674761569, "protein": "GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI", @@ -111,9 +111,9 @@ { "name": "tat_exon2", "start": 1746, - "end": 1824, + "end": 1823, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.7616257781032589, "protein": "RCIRSTTRTADTELFTRDFPLGTFQ", @@ -123,9 +123,9 @@ { "name": "rev_exon2", "start": 1747, - "end": 1927, + "end": 1926, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.7620186257236345, "protein": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI", @@ -137,9 +137,9 @@ { "name": "gag", "start": 639, - "end": 2142, + "end": 2141, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.0801186943620179, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ", @@ -149,9 +149,9 @@ { "name": "pol", "start": 1934, - "end": 4946, + "end": 4945, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.054722889368558514, "protein": "FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -161,9 +161,9 @@ { "name": "vif", "start": 4890, - "end": 5469, + "end": 5468, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.09157509157509158, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -173,9 +173,9 @@ { "name": "vpr", "start": 5408, - "end": 5699, + "end": 5698, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.09157509157509158, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS", @@ -185,21 +185,21 @@ { "name": "tat_exon1", "start": 5679, - "end": 5898, + "end": 5894, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5818, - "end": 5899, + "end": 5898, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEDLLKTVRLIKFLYQSSK", @@ -209,9 +209,9 @@ { "name": "vpu", "start": 5910, - "end": 6156, + "end": 6155, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7333193453629878, "protein": "MQPIQIAIVALVVAIIIAIVV", @@ -221,9 +221,9 @@ { "name": "env", "start": 6070, - "end": 8656, + "end": 8655, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.1405525502318391, "protein": "MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL", @@ -233,9 +233,9 @@ { "name": "tat_exon2", "start": 8237, - "end": 8333, + "end": 8332, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.6672629695885509, "protein": "RPTSQTRGDPTGPKE", @@ -245,9 +245,9 @@ { "name": "rev_exon2", "start": 8238, - "end": 8514, + "end": 8513, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.210025203024363, "protein": "DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE", @@ -257,9 +257,9 @@ { "name": "nef", "start": 8657, - "end": 9278, + "end": 9277, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.06582796957284964, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", @@ -271,9 +271,9 @@ { "name": "nef", "start": 0, - "end": 4059, + "end": 4058, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.7628009106462086, "protein": "MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ", @@ -283,9 +283,9 @@ { "name": "env", "start": 2, - "end": 4115, + "end": 4114, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.76033143808071, "protein": "MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -295,9 +295,9 @@ { "name": "gag", "start": 789, - "end": 2292, + "end": 2291, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.19470123431286457, "protein": "MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ", @@ -307,9 +307,9 @@ { "name": "pol", "start": 2084, - "end": 4115, + "end": 4114, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.5617851221088768, "protein": "FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -319,9 +319,9 @@ { "name": "vif", "start": 3617, - "end": 4115, + "end": 4114, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7631664499349805, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -331,9 +331,9 @@ { "name": "vpr", "start": 3617, - "end": 4115, + "end": 4114, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.7629151983204618, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -343,9 +343,9 @@ { "name": "vpu", "start": 3617, - "end": 4115, + "end": 4114, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7634058115037564, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -355,9 +355,9 @@ { "name": "tat_exon1", "start": 3823, - "end": 4084, + "end": 4083, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.7659115426105717, "protein": "MVPVRERTHSRSRNLLCRWGS", @@ -367,9 +367,9 @@ { "name": "rev_exon1", "start": 3823, - "end": 4084, + "end": 4083, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.7610789980732178, "protein": "MVPVRERTHSRSRNLLCRWGS", @@ -379,9 +379,9 @@ { "name": "tat_exon2", "start": 4080, - "end": 4164, + "end": 4163, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.769292994661058, "protein": "IPSGEPSDAAYKQLLFACTGSLWLDQI", @@ -391,9 +391,9 @@ { "name": "rev_exon2", "start": 4081, - "end": 4153, + "end": 4152, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.7667894365645325, "protein": "YPVASPQMLHISSCFLPVLGLSG", @@ -405,9 +405,9 @@ { "name": "gag", "start": 775, - "end": 2281, + "end": 2280, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.20784453738651432, "protein": "MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ", @@ -417,9 +417,9 @@ { "name": "pol", "start": 2070, - "end": 5085, + "end": 5084, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.14843087362171337, "protein": "FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED", @@ -429,9 +429,9 @@ { "name": "vif", "start": 5029, - "end": 5608, + "end": 5607, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.2608047690014903, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH", @@ -441,9 +441,9 @@ { "name": "vpr", "start": 5547, - "end": 5838, + "end": 5837, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS", @@ -453,9 +453,9 @@ { "name": "tat_exon1", "start": 5818, - "end": 6037, + "end": 6036, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ", @@ -465,9 +465,9 @@ { "name": "rev_exon1", "start": 5957, - "end": 6038, + "end": 6037, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4274965800273598, "protein": "MAGRSGDSDEELLKTVRLIKFLYQSSK", @@ -477,9 +477,9 @@ { "name": "vpu", "start": 6049, - "end": 6298, + "end": 6297, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.520618556701031, "protein": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL", @@ -489,9 +489,9 @@ { "name": "env", "start": 6212, - "end": 8783, + "end": 8782, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4766895145301081, "protein": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL", @@ -501,9 +501,9 @@ { "name": "tat_exon2", "start": 8364, - "end": 8460, + "end": 8459, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.3921568627450981, "protein": "RPASQPRGDPTGPKESKKKVERETETDPLH", @@ -513,9 +513,9 @@ { "name": "rev_exon2", "start": 8365, - "end": 8641, + "end": 8640, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.29843322556577967, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE", @@ -525,9 +525,9 @@ { "name": "nef", "start": 8784, - "end": 9387, + "end": 9386, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.3966849799795139, "protein": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC", @@ -539,9 +539,9 @@ { "name": "gag", "start": 315, - "end": 1665, + "end": 1664, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.596665989022159, "protein": "MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ", @@ -551,9 +551,9 @@ { "name": "pol", "start": 1427, - "end": 4469, + "end": 4468, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.27887169154684477, "protein": "FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -563,9 +563,9 @@ { "name": "vif", "start": 4413, - "end": 4992, + "end": 4991, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH", @@ -575,9 +575,9 @@ { "name": "vpr", "start": 4931, - "end": 5222, + "end": 5221, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3808935556928146, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS", @@ -587,21 +587,21 @@ { "name": "tat_exon1", "start": 5202, - "end": 5421, + "end": 5417, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.40192926045016075, "protein": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", - "aminoacids": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ*", - "nucleotides": "ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAA" + "aminoacids": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", + "nucleotides": "ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAG" }, { "name": "rev_exon1", "start": 5341, - "end": 5422, + "end": 5421, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.524971623155505, "protein": "MAGRSGDRDEDLLKTVRLIKFLYQSSK", @@ -611,9 +611,9 @@ { "name": "vpu", "start": 5433, - "end": 5682, + "end": 5681, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5244381020335356, "protein": "MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL", @@ -623,9 +623,9 @@ { "name": "env", "start": 5596, - "end": 8158, + "end": 8157, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5152420275849952, "protein": "MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ", @@ -635,9 +635,9 @@ { "name": "tat_exon2", "start": 7739, - "end": 7835, + "end": 7834, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.6842105263157894, "protein": "RPSSQPRGDQTGPKE", @@ -647,9 +647,9 @@ { "name": "rev_exon2", "start": 7740, - "end": 8016, + "end": 8015, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.4267425320056898, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE", @@ -659,9 +659,9 @@ { "name": "nef", "start": 8159, - "end": 8813, + "end": 8812, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4891015417331206, "protein": "MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC", @@ -673,9 +673,9 @@ { "name": "gag", "start": 522, - "end": 1590, + "end": 1589, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.6828741441147701, "protein": "MYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP", @@ -685,9 +685,9 @@ { "name": "pol", "start": 1382, - "end": 4394, + "end": 4393, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.23966680468616797, "protein": "FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED", @@ -697,9 +697,9 @@ { "name": "vif", "start": 4338, - "end": 4920, + "end": 4919, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.42479043044174425, "protein": "MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH", @@ -709,9 +709,9 @@ { "name": "vpr", "start": 4859, - "end": 5150, + "end": 5149, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.36116422349691957, "protein": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS", @@ -721,21 +721,21 @@ { "name": "tat_exon1", "start": 5130, - "end": 5349, + "end": 5345, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.46628407460545196, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAGGACTGCGTGCACCAGTTGCTATTGTAAAAAGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAGGACTGCGTGCACCAGTTGCTATTGTAAAAAGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5269, - "end": 5350, + "end": 5349, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.5763097949886105, "protein": "MAGRSGDSDEELLRIAGTIKFLYQSSK", @@ -745,9 +745,9 @@ { "name": "vpu", "start": 5361, - "end": 5631, + "end": 5630, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5680096940321115, "protein": "MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL", @@ -757,9 +757,9 @@ { "name": "env", "start": 5524, - "end": 8110, + "end": 8109, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.49863720871464445, "protein": "MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL", @@ -769,9 +769,9 @@ { "name": "tat_exon2", "start": 7691, - "end": 7784, + "end": 7783, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4464285714285715, "protein": "RPSSQPRGDPTGPKESEKKVERETETDPVT", @@ -781,9 +781,9 @@ { "name": "rev_exon2", "start": 7692, - "end": 7968, + "end": 7967, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.4267425320056898, "protein": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE", @@ -793,9 +793,9 @@ { "name": "nef", "start": 8111, - "end": 8735, + "end": 8734, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5036770338593534, "protein": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC", @@ -807,9 +807,9 @@ { "name": "gag", "start": 680, - "end": 2180, + "end": 2179, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -819,9 +819,9 @@ { "name": "pol", "start": 1972, - "end": 4984, + "end": 4983, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -831,9 +831,9 @@ { "name": "vif", "start": 4928, - "end": 5507, + "end": 5506, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -843,9 +843,9 @@ { "name": "vpr", "start": 5446, - "end": 5737, + "end": 5736, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -855,9 +855,9 @@ { "name": "tat_exon1", "start": 5717, - "end": 5936, + "end": 5935, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -867,21 +867,21 @@ { "name": "rev_exon1", "start": 5856, - "end": 5937, + "end": 5933, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 5948, - "end": 6194, + "end": 6193, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -891,9 +891,9 @@ { "name": "env", "start": 6111, - "end": 8652, + "end": 8651, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -903,9 +903,9 @@ { "name": "tat_exon2", "start": 8233, - "end": 8329, + "end": 8328, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -915,9 +915,9 @@ { "name": "rev_exon2", "start": 8234, - "end": 8510, + "end": 8509, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -927,9 +927,9 @@ { "name": "nef", "start": 8653, - "end": 9268, + "end": 9267, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -941,9 +941,9 @@ { "name": "gag", "start": 777, - "end": 2286, + "end": 2285, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.24076694150363465, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ", @@ -953,9 +953,9 @@ { "name": "pol", "start": 2078, - "end": 5090, + "end": 5089, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.185747174550021, "protein": "FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -965,9 +965,9 @@ { "name": "vif", "start": 5034, - "end": 5613, + "end": 5612, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.39766435115272314, "protein": "MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH", @@ -977,9 +977,9 @@ { "name": "vpr", "start": 5552, - "end": 5843, + "end": 5842, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.37688442211055273, "protein": "MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS", @@ -989,21 +989,21 @@ { "name": "tat_exon1", "start": 5823, - "end": 6042, + "end": 6038, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.40192926045016075, "protein": "MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ", - "aminoacids": "MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAATCTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCACTTGCTATTGTAAACAGTGTTGCTATCATTGCCAAGTTTGTTTCATAACCAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAATCTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCACTTGCTATTGTAAACAGTGTTGCTATCATTGCCAAGTTTGTTTCATAACCAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5962, - "end": 6043, + "end": 6042, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.524971623155505, "protein": "MAGRSGDNDEDLLKTVRFIKLLYQSSK", @@ -1013,9 +1013,9 @@ { "name": "vpu", "start": 6054, - "end": 6300, + "end": 6299, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.48542752364408415, "protein": "MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL", @@ -1025,9 +1025,9 @@ { "name": "env", "start": 6217, - "end": 8800, + "end": 8799, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.49751604598034604, "protein": "MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ", @@ -1037,9 +1037,9 @@ { "name": "tat_exon2", "start": 8381, - "end": 8474, + "end": 8473, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPTSQPRGDPTGPKEPETKVESKTETDPLT", @@ -1049,9 +1049,9 @@ { "name": "rev_exon2", "start": 8382, - "end": 8658, + "end": 8657, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.42982806877249113, "protein": "DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE", @@ -1061,9 +1061,9 @@ { "name": "nef", "start": 8801, - "end": 9425, + "end": 9424, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.459649710885779, "protein": "MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN", @@ -1075,9 +1075,9 @@ { "name": "gag", "start": 579, - "end": 2079, + "end": 2078, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -1087,9 +1087,9 @@ { "name": "pol", "start": 1871, - "end": 4883, + "end": 4882, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -1099,9 +1099,9 @@ { "name": "vif", "start": 4827, - "end": 5406, + "end": 5405, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.378905844492889, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -1111,9 +1111,9 @@ { "name": "vpr", "start": 5345, - "end": 5636, + "end": 5635, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -1123,21 +1123,21 @@ { "name": "tat_exon1", "start": 5616, - "end": 5835, + "end": 5831, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5755, - "end": 5836, + "end": 5835, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -1147,9 +1147,9 @@ { "name": "vpu", "start": 5847, - "end": 6093, + "end": 6092, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -1159,9 +1159,9 @@ { "name": "env", "start": 6010, - "end": 8551, + "end": 8550, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4585964351370794, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -1171,9 +1171,9 @@ { "name": "tat_exon2", "start": 8132, - "end": 8228, + "end": 8227, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -1183,9 +1183,9 @@ { "name": "rev_exon2", "start": 8133, - "end": 8409, + "end": 8408, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -1195,9 +1195,9 @@ { "name": "nef", "start": 8552, - "end": 9167, + "end": 9166, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4690990320178705, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -1209,9 +1209,9 @@ { "name": "gag", "start": 584, - "end": 2084, + "end": 2083, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -1221,9 +1221,9 @@ { "name": "pol", "start": 1876, - "end": 4888, + "end": 4887, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19298018391400085, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -1233,9 +1233,9 @@ { "name": "vif", "start": 4832, - "end": 5411, + "end": 5410, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.378905844492889, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -1245,9 +1245,9 @@ { "name": "vpr", "start": 5350, - "end": 5641, + "end": 5640, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -1257,9 +1257,9 @@ { "name": "tat_exon1", "start": 5621, - "end": 5840, + "end": 5839, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -1269,21 +1269,21 @@ { "name": "rev_exon1", "start": 5760, - "end": 5841, + "end": 5837, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 5852, - "end": 6098, + "end": 6097, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -1293,9 +1293,9 @@ { "name": "env", "start": 6015, - "end": 8556, + "end": 8555, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.46021436825118545, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -1305,9 +1305,9 @@ { "name": "tat_exon2", "start": 8137, - "end": 8233, + "end": 8232, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -1317,9 +1317,9 @@ { "name": "rev_exon2", "start": 8138, - "end": 8414, + "end": 8413, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -1329,9 +1329,9 @@ { "name": "nef", "start": 8557, - "end": 9172, + "end": 9171, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4690990320178705, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -1343,9 +1343,9 @@ { "name": "gag", "start": 707, - "end": 2207, + "end": 2206, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -1355,9 +1355,9 @@ { "name": "pol", "start": 1999, - "end": 5011, + "end": 5010, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19298018391400085, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -1367,9 +1367,9 @@ { "name": "vif", "start": 4955, - "end": 5534, + "end": 5533, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.378905844492889, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -1379,9 +1379,9 @@ { "name": "vpr", "start": 5473, - "end": 5764, + "end": 5763, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -1391,9 +1391,9 @@ { "name": "tat_exon1", "start": 5744, - "end": 5963, + "end": 5962, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -1403,21 +1403,21 @@ { "name": "rev_exon1", "start": 5883, - "end": 5964, + "end": 5960, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 5975, - "end": 6221, + "end": 6220, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -1427,9 +1427,9 @@ { "name": "env", "start": 6138, - "end": 8679, + "end": 8678, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.46021436825118545, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -1439,9 +1439,9 @@ { "name": "tat_exon2", "start": 8260, - "end": 8356, + "end": 8355, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -1451,9 +1451,9 @@ { "name": "rev_exon2", "start": 8261, - "end": 8537, + "end": 8536, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -1463,9 +1463,9 @@ { "name": "nef", "start": 8680, - "end": 9295, + "end": 9294, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4690990320178705, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -1477,9 +1477,9 @@ { "name": "gag", "start": 176, - "end": 1685, + "end": 1684, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.27304152847199525, "protein": "MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP", @@ -1489,9 +1489,9 @@ { "name": "pol", "start": 1477, - "end": 4489, + "end": 4488, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.26443159013103534, "protein": "FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED", @@ -1501,9 +1501,9 @@ { "name": "vif", "start": 4433, - "end": 5012, + "end": 5011, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3903081914030819, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH", @@ -1513,9 +1513,9 @@ { "name": "vpr", "start": 4951, - "end": 5242, + "end": 5241, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", @@ -1525,9 +1525,9 @@ { "name": "tat_exon1", "start": 5222, - "end": 5441, + "end": 5440, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.48954161103693805, "protein": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", @@ -1537,21 +1537,21 @@ { "name": "rev_exon1", "start": 5361, - "end": 5442, + "end": 5438, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.5290287574606619, - "protein": "MAGRSGDSDEELLTAVRIIKRLYQSSK", - "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG" + "distance": 0.4886988393402566, + "protein": "MAGRSGDSDEELLTAVRIIKRLYQSS", + "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT" }, { "name": "vpu", "start": 5453, - "end": 5699, + "end": 5698, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5682727709300466, "protein": "MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM", @@ -1561,9 +1561,9 @@ { "name": "env", "start": 5616, - "end": 8217, + "end": 8216, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5091484869809996, "protein": "MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL", @@ -1573,9 +1573,9 @@ { "name": "tat_exon2", "start": 7798, - "end": 7891, + "end": 7890, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD", @@ -1585,9 +1585,9 @@ { "name": "rev_exon2", "start": 7799, - "end": 8075, + "end": 8074, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE", @@ -1597,9 +1597,9 @@ { "name": "nef", "start": 8218, - "end": 8860, + "end": 8859, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5432971135257649, "protein": "MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC", @@ -1611,9 +1611,9 @@ { "name": "gag", "start": 663, - "end": 2163, + "end": 2162, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -1623,9 +1623,9 @@ { "name": "pol", "start": 1955, - "end": 4967, + "end": 4966, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -1635,9 +1635,9 @@ { "name": "vif", "start": 4911, - "end": 5490, + "end": 5489, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -1647,9 +1647,9 @@ { "name": "vpr", "start": 5429, - "end": 5720, + "end": 5719, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -1659,21 +1659,21 @@ { "name": "tat_exon1", "start": 5700, - "end": 5919, + "end": 5915, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5839, - "end": 5920, + "end": 5919, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -1683,9 +1683,9 @@ { "name": "vpu", "start": 5931, - "end": 6177, + "end": 6176, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -1695,9 +1695,9 @@ { "name": "env", "start": 6094, - "end": 8635, + "end": 8634, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -1707,9 +1707,9 @@ { "name": "tat_exon2", "start": 8216, - "end": 8312, + "end": 8311, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -1719,9 +1719,9 @@ { "name": "rev_exon2", "start": 8217, - "end": 8493, + "end": 8492, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -1731,9 +1731,9 @@ { "name": "nef", "start": 8636, - "end": 9251, + "end": 9250, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -1745,9 +1745,9 @@ { "name": "gag", "start": 250, - "end": 1753, + "end": 1752, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.25132972351334526, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP", @@ -1757,9 +1757,9 @@ { "name": "pol", "start": 1545, - "end": 4557, + "end": 4556, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.2540106951871657, "protein": "FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED", @@ -1769,9 +1769,9 @@ { "name": "vif", "start": 4501, - "end": 5083, + "end": 5082, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.40472673559822736, "protein": "MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH", @@ -1781,9 +1781,9 @@ { "name": "vpr", "start": 5022, - "end": 5313, + "end": 5312, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3808935556928146, "protein": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS", @@ -1793,9 +1793,9 @@ { "name": "tat_exon1", "start": 5293, - "end": 5512, + "end": 5511, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.4691531785127845, "protein": "MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ", @@ -1805,9 +1805,9 @@ { "name": "rev_exon1", "start": 5432, - "end": 5513, + "end": 5512, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.564475664826894, "protein": "MAGRSGDSDEELLRITRTIKFLYQNSE", @@ -1817,9 +1817,9 @@ { "name": "vpu", "start": 5524, - "end": 5794, + "end": 5793, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5776066350710902, "protein": "MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL", @@ -1829,9 +1829,9 @@ { "name": "env", "start": 5687, - "end": 8198, + "end": 8197, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.6638103647692366, "protein": "MHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL", @@ -1841,9 +1841,9 @@ { "name": "tat_exon2", "start": 7779, - "end": 7872, + "end": 7871, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4464285714285715, "protein": "RPSSQPRGDPTGPKESEKKVERETETDPVT", @@ -1853,9 +1853,9 @@ { "name": "rev_exon2", "start": 7780, - "end": 8056, + "end": 8055, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.4267425320056898, "protein": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE", @@ -1865,9 +1865,9 @@ { "name": "nef", "start": 8199, - "end": 8823, + "end": 8822, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5093153589821267, "protein": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC", @@ -1879,9 +1879,9 @@ { "name": "gag", "start": 316, - "end": 1819, + "end": 1818, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.24298292552415257, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP", @@ -1891,9 +1891,9 @@ { "name": "pol", "start": 1611, - "end": 4623, + "end": 4622, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.25132972351334504, "protein": "FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED", @@ -1903,9 +1903,9 @@ { "name": "vif", "start": 4567, - "end": 5149, + "end": 5148, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.42180774748923966, "protein": "MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH", @@ -1915,9 +1915,9 @@ { "name": "vpr", "start": 5088, - "end": 5379, + "end": 5378, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.36116422349691957, "protein": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS", @@ -1927,9 +1927,9 @@ { "name": "tat_exon1", "start": 5359, - "end": 5578, + "end": 5577, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.4691531785127845, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ", @@ -1939,9 +1939,9 @@ { "name": "rev_exon1", "start": 5498, - "end": 5579, + "end": 5578, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.5884955752212389, "protein": "MAGRSGDSDEELLKITRTIKFLYQNSE", @@ -1951,9 +1951,9 @@ { "name": "vpu", "start": 5590, - "end": 5860, + "end": 5859, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5680096940321115, "protein": "MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWDVNDL", @@ -1963,9 +1963,9 @@ { "name": "env", "start": 5753, - "end": 8315, + "end": 8314, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4938011995318903, "protein": "MRVKGTKKNWQPSWRWGTMLIWGWATMLLGMSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCENVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL", @@ -1975,9 +1975,9 @@ { "name": "tat_exon2", "start": 7896, - "end": 7989, + "end": 7988, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4464285714285715, "protein": "RPSSQPRGDPTGPKESEKKVERETETDPVT", @@ -1987,9 +1987,9 @@ { "name": "rev_exon2", "start": 7897, - "end": 8173, + "end": 8172, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.44369946756063905, "protein": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGSGTSGTQGVGSPQVLVESPAVLEPGTKE", @@ -1999,9 +1999,9 @@ { "name": "nef", "start": 8316, - "end": 8940, + "end": 8939, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5036770338593534, "protein": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC", @@ -2013,9 +2013,9 @@ { "name": "gag", "start": 532, - "end": 2047, + "end": 2046, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.27270615563298484, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ", @@ -2025,9 +2025,9 @@ { "name": "pol", "start": 1839, - "end": 4851, + "end": 4850, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.21944123990570308, "protein": "FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -2037,9 +2037,9 @@ { "name": "vif", "start": 4795, - "end": 5374, + "end": 5373, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH", @@ -2049,9 +2049,9 @@ { "name": "vpr", "start": 5313, - "end": 5598, + "end": 5597, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.39401343921808174, "protein": "MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS", @@ -2061,9 +2061,9 @@ { "name": "tat_exon1", "start": 5578, - "end": 5797, + "end": 5796, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.5138258357408172, "protein": "MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ", @@ -2073,9 +2073,9 @@ { "name": "rev_exon1", "start": 5717, - "end": 5798, + "end": 5797, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.5940834141610087, "protein": "MAGRSGDRDEDLLETVRFIKFLYQNSK", @@ -2085,9 +2085,9 @@ { "name": "vpu", "start": 5809, - "end": 6055, + "end": 6054, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5727186311787074, "protein": "MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL", @@ -2097,9 +2097,9 @@ { "name": "env", "start": 5972, - "end": 8549, + "end": 8548, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5021538905210794, "protein": "MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL", @@ -2109,9 +2109,9 @@ { "name": "tat_exon2", "start": 8130, - "end": 8226, + "end": 8225, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.6074396517609815, "protein": "RPPAQPQGDPTGPKKSKKEVEKETETDQCD", @@ -2121,9 +2121,9 @@ { "name": "rev_exon2", "start": 8131, - "end": 8407, + "end": 8406, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.47688921496698455, "protein": "DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE", @@ -2133,9 +2133,9 @@ { "name": "nef", "start": 8550, - "end": 8985, + "end": 8984, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.6017710152157637, "protein": "MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK", @@ -2147,9 +2147,9 @@ { "name": "gag", "start": 120, - "end": 2022, + "end": 2021, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.7511039743075072, "protein": "MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC", @@ -2159,9 +2159,9 @@ { "name": "pol", "start": 1787, - "end": 4826, + "end": 4825, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.7637180771917039, "protein": "ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI", @@ -2171,9 +2171,9 @@ { "name": "vif", "start": 4425, - "end": 5349, + "end": 5348, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7566838361540349, "protein": "MIVWQVDRMKIRTWKSLVKYHMYISKKAKK", @@ -2183,9 +2183,9 @@ { "name": "vpr", "start": 5033, - "end": 5579, + "end": 5578, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.7334692430420138, "protein": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS", @@ -2195,21 +2195,21 @@ { "name": "tat_exon1", "start": 5486, - "end": 5780, + "end": 5776, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.7619181418001311, "protein": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS", - "aminoacids": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS*TRALEASRKSA*DSLYQLLL*KVLLSLPSVFYTKSLRHLLWQEEAETETKISSRQSDSSSSSTKAVN", - "nucleotides": "ATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACTAGAGCCCTAGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAAT" + "aminoacids": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS*TRALEASRKSA*DSLYQLLL*KVLLSLPSVFYTKSLRHLLWQEEAETETKISSRQSDSSSSSTKAV", + "nucleotides": "ATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACTAGAGCCCTAGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTA" }, { "name": "rev_exon1", "start": 5698, - "end": 5779, + "end": 5778, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.524971623155505, "protein": "MAGRSGDRDEDLLKTVRLIKFLYQSSK", @@ -2219,9 +2219,9 @@ { "name": "vpu", "start": 5790, - "end": 6039, + "end": 6038, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7407973896196594, "protein": "MQPLKILAIVALVVAAIIAIVV", @@ -2231,9 +2231,9 @@ { "name": "env", "start": 5953, - "end": 8521, + "end": 8520, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.7529994904340572, "protein": "MTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD", @@ -2243,9 +2243,9 @@ { "name": "nef", "start": 7916, - "end": 9176, + "end": 9175, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.7587548638132295, "protein": "MSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC", @@ -2255,9 +2255,9 @@ { "name": "tat_exon2", "start": 8102, - "end": 8198, + "end": 8197, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.7134052388289676, "protein": "RPSSQPQEDQTGPKE", @@ -2267,9 +2267,9 @@ { "name": "rev_exon2", "start": 8103, - "end": 8379, + "end": 8378, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.6888374145157732, "protein": "ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE", @@ -2281,9 +2281,9 @@ { "name": "gag", "start": 302, - "end": 1715, + "end": 1714, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.7484174646972894, "protein": "MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC", @@ -2293,9 +2293,9 @@ { "name": "pol", "start": 1613, - "end": 4625, + "end": 4624, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.7535201229073285, "protein": "AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED", @@ -2305,9 +2305,9 @@ { "name": "vif", "start": 4289, - "end": 4988, + "end": 4987, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7624714704923379, "protein": "MAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED", @@ -2317,9 +2317,9 @@ { "name": "vpr", "start": 5087, - "end": 5378, + "end": 5377, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.6737199868435482, "protein": "MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT", @@ -2329,21 +2329,21 @@ { "name": "tat_exon1", "start": 5235, - "end": 5577, + "end": 5573, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.6325105553751218, "protein": "MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ", - "aminoacids": "MEILRQR*KP**EPCNNCCSFISELGVNIAG*ELFDRGEQEIEPVDPSLEP*KHPGSQPMTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ*", - "nucleotides": "ATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGCTTAGAGCCCTAGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAACAAAAAGCTTAGGCATCTCCTATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA" + "aminoacids": "MEILRQR*KP**EPCNNCCSFISELGVNIAG*ELFDRGEQEIEPVDPSLEP*KHPGSQPMTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ", + "nucleotides": "ATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGCTTAGAGCCCTAGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAACAAAAAGCTTAGGCATCTCCTATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAG" }, { "name": "rev_exon1", "start": 5497, - "end": 5578, + "end": 5577, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.564475664826894, "protein": "MAGRSRDSDEELLTAVRIIKRLYQSSK", @@ -2353,9 +2353,9 @@ { "name": "vpu", "start": 5589, - "end": 5835, + "end": 5834, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.6256860592755216, "protein": "MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP", @@ -2365,9 +2365,9 @@ { "name": "env", "start": 5752, - "end": 8353, + "end": 8352, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.7518870380010406, "protein": "MKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD", @@ -2377,9 +2377,9 @@ { "name": "nef", "start": 7748, - "end": 8996, + "end": 8995, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.7328145265888457, "protein": "MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR", @@ -2389,9 +2389,9 @@ { "name": "tat_exon2", "start": 7934, - "end": 8027, + "end": 8026, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.5633802816901408, "protein": "RPSSQPREDPTGPKEQKKEVERKTEAHPRD", @@ -2401,9 +2401,9 @@ { "name": "rev_exon2", "start": 7935, - "end": 8211, + "end": 8210, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.6781884553958476, "protein": "ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE", @@ -2415,9 +2415,9 @@ { "name": "gag", "start": 292, - "end": 1795, + "end": 1794, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.25442849599155104, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ", @@ -2427,9 +2427,9 @@ { "name": "pol", "start": 1587, - "end": 4599, + "end": 4598, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.17509882471546434, "protein": "FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -2439,9 +2439,9 @@ { "name": "vif", "start": 4543, - "end": 5122, + "end": 5121, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.34158090650317496, "protein": "MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH", @@ -2451,9 +2451,9 @@ { "name": "vpr", "start": 5061, - "end": 5352, + "end": 5351, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.2608047690014903, "protein": "MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS", @@ -2463,9 +2463,9 @@ { "name": "tat_exon1", "start": 5332, - "end": 5551, + "end": 5550, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.37688442211055273, "protein": "MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ", @@ -2475,9 +2475,9 @@ { "name": "rev_exon1", "start": 5471, - "end": 5552, + "end": 5551, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEDLLKTVRLIKYLYQSSE", @@ -2487,9 +2487,9 @@ { "name": "vpu", "start": 5563, - "end": 5809, + "end": 5808, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5560235888795282, "protein": "MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL", @@ -2499,9 +2499,9 @@ { "name": "env", "start": 5726, - "end": 8288, + "end": 8287, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5276672448389619, "protein": "MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL", @@ -2511,9 +2511,9 @@ { "name": "tat_exon2", "start": 7869, - "end": 7965, + "end": 7964, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.6995153473344102, "protein": "RPSSQLRGEPTGPKE", @@ -2523,9 +2523,9 @@ { "name": "rev_exon2", "start": 7870, - "end": 8146, + "end": 8145, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.32366339007432277, "protein": "DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE", @@ -2535,9 +2535,9 @@ { "name": "nef", "start": 8289, - "end": 8940, + "end": 8939, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4631394979345408, "protein": "MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC", @@ -2549,9 +2549,9 @@ { "name": "gag", "start": 521, - "end": 2021, + "end": 2020, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -2561,9 +2561,9 @@ { "name": "pol", "start": 1813, - "end": 4825, + "end": 4824, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -2573,9 +2573,9 @@ { "name": "vif", "start": 4769, - "end": 5348, + "end": 5347, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -2585,9 +2585,9 @@ { "name": "vpr", "start": 5287, - "end": 5578, + "end": 5577, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -2597,9 +2597,9 @@ { "name": "tat_exon1", "start": 5558, - "end": 5777, + "end": 5776, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -2609,21 +2609,21 @@ { "name": "rev_exon1", "start": 5697, - "end": 5778, + "end": 5774, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 5789, - "end": 6035, + "end": 6034, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -2633,9 +2633,9 @@ { "name": "env", "start": 5952, - "end": 8493, + "end": 8492, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -2645,9 +2645,9 @@ { "name": "tat_exon2", "start": 8074, - "end": 8170, + "end": 8169, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -2657,9 +2657,9 @@ { "name": "rev_exon2", "start": 8075, - "end": 8351, + "end": 8350, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -2669,9 +2669,9 @@ { "name": "nef", "start": 8494, - "end": 9109, + "end": 9108, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -2683,9 +2683,9 @@ { "name": "gag", "start": 488, - "end": 1601, + "end": 1600, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.7372881355932204, "protein": "MSQVNSTTVMMQKGNFRNQKKTVKCFNCGKIGHIAKNCRAPRRKGCWKCGQEGHQMKDCSERQANFLGKLWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPIDRELYSLASLKSLFGNDPSSQ", @@ -2695,9 +2695,9 @@ { "name": "pol", "start": 1393, - "end": 4405, + "end": 4404, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.2413273001508296, "protein": "FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED", @@ -2707,9 +2707,9 @@ { "name": "vif", "start": 4349, - "end": 4928, + "end": 4927, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.41532297468972923, "protein": "MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH", @@ -2719,9 +2719,9 @@ { "name": "vpr", "start": 4867, - "end": 5158, + "end": 5157, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.4489646325820048, "protein": "MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPRIWLQSLGQYVYETYGDTWTGVEAIIRILQQMLFIHFRIGCQHSRIGIIRRGRTRNGASRP", @@ -2731,9 +2731,9 @@ { "name": "tat_exon1", "start": 5138, - "end": 5357, + "end": 5356, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.5243736647892796, "protein": "MEPVDPSLAPWKHPGSQPKTACTNCYCKKCCLHCQVCFTKKGLGISYGRKKRRQRRRPPQSSKAHQNPLPKQ", @@ -2743,21 +2743,21 @@ { "name": "rev_exon1", "start": 5277, - "end": 5358, + "end": 5354, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.524971623155505, - "protein": "MAGRSGDSDEDLLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEDLLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAGCAGTAAGGCTCATCAAAATCCTCTACCAAAGCAGTAAG" + "distance": 0.48200514138817474, + "protein": "MAGRSGDSDEDLLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEDLLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAGCAGTAAGGCTCATCAAAATCCTCTACCAAAGCAGT" }, { "name": "vpu", "start": 5369, - "end": 5615, + "end": 5614, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5568484042553192, "protein": "MQSLQIGAIVALVVGTIIAIVVWSIVLIEYRKILRQKKIDRIIDRIVERAEDSGNESEGDQEELSALVERGHDAPWNVNDL", @@ -2767,9 +2767,9 @@ { "name": "env", "start": 5532, - "end": 8073, + "end": 8072, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.48179770175870373, "protein": "MRVKETRKSYQHWWKGGMMLLGMLMICSAATNLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVLLGNVTEDFNAWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILHCTDVNNTRNGMTGELKNCSFNITTKITNKVQKEYALFYKLDVVPINNKDNDTSFNNNSYRLISCNTSVITQACPKVSFEPIPIHYCTPAGYAILRCNNETFSGKGPCTNVSSIQCTHGIRPVVSTQLLLNGSLAKQEVVIRSQNFSDNVKTIIVQLKTPVKINCTRPNNNTRKSIHAGPGKVIYATGEIIGDIRQAHCNISAAEWNDTLGQIVTKLQEQFGNKTIVFNQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWNNNGTNTWNSTGNITLPCKIRQIVNMWQKVGKAMYAPPIRGQIKCSSNITGLLLTRDGGNESESETFRPGGGDMRDNWRSELYKYKVVRIEPLGLAPTKAKRRVVQREKRAIGTLGAVFLGFLGTAGSTMGAASMTLTVQARQLLSGIVQQQNNLLKAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNASWSNKSLNEIWDNMTWMEWEKEISNYTQLIYTLIEESQSQQEKNEQELLALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEDGGERDRDRSTRLVTGFLPLFWDDLRSLCLFSYHRLRDLLLIAARIVELLGHRGWEILKHWWSLLQYWSQELKKSAVSLLNATAIAVAEGTDRIIEVVQRACRAILHIPVRLRQGLERALL", @@ -2779,9 +2779,9 @@ { "name": "tat_exon2", "start": 7654, - "end": 7750, + "end": 7749, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4464285714285715, "protein": "RPASQPRGDPTGPKESKKTVERETETDPHA", @@ -2791,9 +2791,9 @@ { "name": "rev_exon2", "start": 7655, - "end": 7940, + "end": 7939, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.46126825660935467, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIHTLSNRILTTFLGRPEEPVPLQLPPLERLTLDCSEDCGTSGTQGVGNPQTLVESPTILESGTKKKCC", @@ -2803,9 +2803,9 @@ { "name": "nef", "start": 8074, - "end": 8695, + "end": 8694, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.48762337458875116, "protein": "MGGKWSKSSVVGWPAVRERIRRAGPAAEGVGAVSRDLDKHGAITSNNTPATNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGMIYSQQRQDILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPLETEQVEAATGGENNCLLHPLNQHGMDDPEREVLMWKFDSSLAFHHRAKELHPEYYKDC", @@ -2817,9 +2817,9 @@ { "name": "gag", "start": 683, - "end": 2183, + "end": 2182, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -2829,9 +2829,9 @@ { "name": "pol", "start": 1975, - "end": 4987, + "end": 4986, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -2841,9 +2841,9 @@ { "name": "vif", "start": 4931, - "end": 5510, + "end": 5509, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -2853,9 +2853,9 @@ { "name": "vpr", "start": 5449, - "end": 5740, + "end": 5739, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -2865,9 +2865,9 @@ { "name": "tat_exon1", "start": 5720, - "end": 5939, + "end": 5938, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -2877,21 +2877,21 @@ { "name": "rev_exon1", "start": 5859, - "end": 5940, + "end": 5936, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 5951, - "end": 6197, + "end": 6196, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -2901,9 +2901,9 @@ { "name": "env", "start": 6114, - "end": 8655, + "end": 8654, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -2913,9 +2913,9 @@ { "name": "tat_exon2", "start": 8236, - "end": 8332, + "end": 8331, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -2925,9 +2925,9 @@ { "name": "rev_exon2", "start": 8237, - "end": 8513, + "end": 8512, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -2937,9 +2937,9 @@ { "name": "nef", "start": 8656, - "end": 9271, + "end": 9270, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -2951,9 +2951,9 @@ { "name": "gag", "start": 210, - "end": 1719, + "end": 1718, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.27936962750716343, "protein": "MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP", @@ -2963,9 +2963,9 @@ { "name": "pol", "start": 1511, - "end": 4523, + "end": 4522, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.26443159013103534, "protein": "FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED", @@ -2975,9 +2975,9 @@ { "name": "vif", "start": 4467, - "end": 5046, + "end": 5045, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3903081914030819, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH", @@ -2987,9 +2987,9 @@ { "name": "env", "start": 4985, - "end": 8207, + "end": 8206, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.6657028690558922, "protein": "MHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL", @@ -2999,9 +2999,9 @@ { "name": "vpr", "start": 4985, - "end": 5276, + "end": 5275, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3120665742024965, "protein": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", @@ -3011,21 +3011,21 @@ { "name": "tat_exon1", "start": 5256, - "end": 5475, + "end": 5471, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.4691531785127845, "protein": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", - "aminoacids": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA" + "aminoacids": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAG" }, { "name": "rev_exon1", "start": 5395, - "end": 5476, + "end": 5475, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.5290287574606619, "protein": "MAGRSGDSDEELLTAVRIIKRLYQSSK", @@ -3035,9 +3035,9 @@ { "name": "vpu", "start": 5487, - "end": 5733, + "end": 5732, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5568484042553192, "protein": "MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM", @@ -3047,9 +3047,9 @@ { "name": "tat_exon2", "start": 7788, - "end": 7881, + "end": 7880, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD", @@ -3059,9 +3059,9 @@ { "name": "rev_exon2", "start": 7789, - "end": 8065, + "end": 8064, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE", @@ -3071,9 +3071,9 @@ { "name": "nef", "start": 8208, - "end": 8850, + "end": 8849, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5432971135257649, "protein": "MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC", @@ -3085,9 +3085,9 @@ { "name": "gag", "start": 739, - "end": 2239, + "end": 2238, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -3097,9 +3097,9 @@ { "name": "pol", "start": 2031, - "end": 5043, + "end": 5042, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -3109,9 +3109,9 @@ { "name": "vif", "start": 4987, - "end": 5566, + "end": 5565, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -3121,9 +3121,9 @@ { "name": "vpr", "start": 5505, - "end": 5796, + "end": 5795, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -3133,9 +3133,9 @@ { "name": "tat_exon1", "start": 5776, - "end": 5995, + "end": 5994, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3145,9 +3145,9 @@ { "name": "rev_exon1", "start": 5915, - "end": 5996, + "end": 5995, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -3157,9 +3157,9 @@ { "name": "vpu", "start": 6007, - "end": 6253, + "end": 6252, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -3169,9 +3169,9 @@ { "name": "env", "start": 6170, - "end": 8711, + "end": 8710, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4583799776107468, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -3181,9 +3181,9 @@ { "name": "tat_exon2", "start": 8292, - "end": 8388, + "end": 8387, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3193,9 +3193,9 @@ { "name": "rev_exon2", "start": 8293, - "end": 8569, + "end": 8568, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -3205,9 +3205,9 @@ { "name": "nef", "start": 8712, - "end": 9327, + "end": 9326, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -3219,9 +3219,9 @@ { "name": "gag", "start": 221, - "end": 1730, + "end": 1729, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.2880084183556756, "protein": "MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP", @@ -3231,9 +3231,9 @@ { "name": "pol", "start": 1522, - "end": 4534, + "end": 4533, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.25117173416656646, "protein": "FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED", @@ -3243,9 +3243,9 @@ { "name": "vif", "start": 4478, - "end": 5057, + "end": 5056, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3903081914030819, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH", @@ -3255,9 +3255,9 @@ { "name": "vpr", "start": 4996, - "end": 5287, + "end": 5286, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3351206434316354, "protein": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", @@ -3267,9 +3267,9 @@ { "name": "tat_exon1", "start": 5267, - "end": 5486, + "end": 5485, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.48954161103693805, "protein": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", @@ -3279,21 +3279,21 @@ { "name": "rev_exon1", "start": 5406, - "end": 5487, + "end": 5483, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.5290287574606619, - "protein": "MAGRSGDSDEELLTAVRIIKRLYQSSK", - "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG" + "distance": 0.4886988393402566, + "protein": "MAGRSGDSDEELLTAVRIIKRLYQSS", + "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT" }, { "name": "vpu", "start": 5498, - "end": 5744, + "end": 5743, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5568484042553192, "protein": "MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM", @@ -3303,9 +3303,9 @@ { "name": "env", "start": 5661, - "end": 8262, + "end": 8261, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5052314240113498, "protein": "MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL", @@ -3315,9 +3315,9 @@ { "name": "tat_exon2", "start": 7843, - "end": 7936, + "end": 7935, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD", @@ -3327,9 +3327,9 @@ { "name": "rev_exon2", "start": 7844, - "end": 8120, + "end": 8119, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE", @@ -3339,9 +3339,9 @@ { "name": "nef", "start": 8263, - "end": 8905, + "end": 8904, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5339772804571117, "protein": "MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC", @@ -3353,9 +3353,9 @@ { "name": "gag", "start": 527, - "end": 2297, + "end": 2296, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.706855791962175, "protein": "MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ", @@ -3365,9 +3365,9 @@ { "name": "pol", "start": 2089, - "end": 5101, + "end": 5100, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.7518376924488996, "protein": "AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED", @@ -3377,9 +3377,9 @@ { "name": "vif", "start": 5045, - "end": 5624, + "end": 5623, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7067546928117459, "protein": "MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY", @@ -3389,9 +3389,9 @@ { "name": "vpr", "start": 5563, - "end": 5854, + "end": 5853, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.37688442211055273, "protein": "MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS", @@ -3401,9 +3401,9 @@ { "name": "tat_exon1", "start": 5563, - "end": 6052, + "end": 6051, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.7571801566579635, "protein": "MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS", @@ -3413,21 +3413,21 @@ { "name": "rev_exon1", "start": 5973, - "end": 6054, + "end": 6050, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEDLLKTVRLIKYLYQSSE", - "aminoacids": "MAGRSGDSDEDLLKTVRLIKYLYQSSE", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEDLLKTVRLIKYLYQSS", + "aminoacids": "MAGRSGDSDEDLLKTVRLIKYLYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGT" }, { "name": "vpu", "start": 6065, - "end": 6311, + "end": 6310, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7521692502681095, "protein": "MQSLYILTIVALVVAAILAIVV", @@ -3437,9 +3437,9 @@ { "name": "env", "start": 6228, - "end": 8799, + "end": 8798, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.7471048806788873, "protein": "MTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST", @@ -3449,9 +3449,9 @@ { "name": "nef", "start": 8194, - "end": 9451, + "end": 9450, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.6514772974147296, "protein": "MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC", @@ -3461,9 +3461,9 @@ { "name": "tat_exon2", "start": 8380, - "end": 8476, + "end": 8475, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.6995153473344102, "protein": "RPSSQPREEPTGPKE", @@ -3473,9 +3473,9 @@ { "name": "rev_exon2", "start": 8381, - "end": 8657, + "end": 8656, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.5716671727907683, "protein": "RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE", @@ -3487,9 +3487,9 @@ { "name": "gag", "start": 746, - "end": 2246, + "end": 2245, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -3499,9 +3499,9 @@ { "name": "pol", "start": 2038, - "end": 5050, + "end": 5049, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -3511,9 +3511,9 @@ { "name": "vif", "start": 4994, - "end": 5573, + "end": 5572, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.378905844492889, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -3523,9 +3523,9 @@ { "name": "vpr", "start": 5512, - "end": 5803, + "end": 5802, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -3535,9 +3535,9 @@ { "name": "tat_exon1", "start": 5783, - "end": 6002, + "end": 6001, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3547,21 +3547,21 @@ { "name": "rev_exon1", "start": 5922, - "end": 6003, + "end": 5999, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 6014, - "end": 6260, + "end": 6259, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -3571,9 +3571,9 @@ { "name": "env", "start": 6177, - "end": 8718, + "end": 8717, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.46021436825118545, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -3583,9 +3583,9 @@ { "name": "tat_exon2", "start": 8299, - "end": 8395, + "end": 8394, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3595,9 +3595,9 @@ { "name": "rev_exon2", "start": 8300, - "end": 8576, + "end": 8575, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -3607,9 +3607,9 @@ { "name": "nef", "start": 8719, - "end": 9334, + "end": 9333, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -3621,9 +3621,9 @@ { "name": "gag", "start": 695, - "end": 2195, + "end": 2194, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -3633,9 +3633,9 @@ { "name": "pol", "start": 1986, - "end": 5004, + "end": 5003, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.6033592883813991, "protein": "YGKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -3645,9 +3645,9 @@ { "name": "vif", "start": 4948, - "end": 5527, + "end": 5526, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.378905844492889, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -3657,9 +3657,9 @@ { "name": "vpr", "start": 5466, - "end": 5757, + "end": 5756, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -3669,9 +3669,9 @@ { "name": "tat_exon1", "start": 5737, - "end": 5956, + "end": 5955, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3681,9 +3681,9 @@ { "name": "rev_exon1", "start": 5876, - "end": 5957, + "end": 5956, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -3693,9 +3693,9 @@ { "name": "vpu", "start": 5968, - "end": 6214, + "end": 6213, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -3705,9 +3705,9 @@ { "name": "env", "start": 6131, - "end": 8672, + "end": 8671, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4585964351370794, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -3717,9 +3717,9 @@ { "name": "tat_exon2", "start": 8253, - "end": 8349, + "end": 8348, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3729,9 +3729,9 @@ { "name": "rev_exon2", "start": 8254, - "end": 8530, + "end": 8529, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -3741,9 +3741,9 @@ { "name": "nef", "start": 8673, - "end": 9288, + "end": 9287, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4690990320178705, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -3755,9 +3755,9 @@ { "name": "gag", "start": 817, - "end": 2317, + "end": 2316, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -3767,9 +3767,9 @@ { "name": "pol", "start": 2109, - "end": 5121, + "end": 5120, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -3779,9 +3779,9 @@ { "name": "vif", "start": 5065, - "end": 5644, + "end": 5643, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -3791,9 +3791,9 @@ { "name": "vpr", "start": 5583, - "end": 5874, + "end": 5873, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -3803,9 +3803,9 @@ { "name": "tat_exon1", "start": 5854, - "end": 6073, + "end": 6072, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3815,9 +3815,9 @@ { "name": "rev_exon1", "start": 5993, - "end": 6074, + "end": 6073, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -3827,9 +3827,9 @@ { "name": "vpu", "start": 6085, - "end": 6331, + "end": 6330, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -3839,9 +3839,9 @@ { "name": "env", "start": 6248, - "end": 8789, + "end": 8788, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -3851,9 +3851,9 @@ { "name": "tat_exon2", "start": 8370, - "end": 8466, + "end": 8465, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3863,9 +3863,9 @@ { "name": "rev_exon2", "start": 8371, - "end": 8647, + "end": 8646, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -3875,9 +3875,9 @@ { "name": "nef", "start": 8790, - "end": 9405, + "end": 9404, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -3889,9 +3889,9 @@ { "name": "gag", "start": 687, - "end": 2187, + "end": 2186, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.2967573174581697, "protein": "MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -3901,9 +3901,9 @@ { "name": "pol", "start": 1979, - "end": 4991, + "end": 4990, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19298018391400085, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -3913,9 +3913,9 @@ { "name": "vif", "start": 4935, - "end": 5514, + "end": 5513, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -3925,9 +3925,9 @@ { "name": "vpr", "start": 5453, - "end": 5744, + "end": 5743, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -3937,21 +3937,21 @@ { "name": "tat_exon1", "start": 5724, - "end": 5943, + "end": 5939, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5863, - "end": 5944, + "end": 5943, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -3961,9 +3961,9 @@ { "name": "vpu", "start": 5955, - "end": 6201, + "end": 6200, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -3973,9 +3973,9 @@ { "name": "env", "start": 6118, - "end": 8659, + "end": 8658, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4620723847297967, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -3985,9 +3985,9 @@ { "name": "tat_exon2", "start": 8240, - "end": 8336, + "end": 8335, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3997,9 +3997,9 @@ { "name": "rev_exon2", "start": 8241, - "end": 8517, + "end": 8516, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -4009,9 +4009,9 @@ { "name": "nef", "start": 8660, - "end": 9275, + "end": 9274, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -4023,9 +4023,9 @@ { "name": "gag", "start": 555, - "end": 2055, + "end": 2054, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -4035,9 +4035,9 @@ { "name": "pol", "start": 1847, - "end": 4859, + "end": 4858, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4047,9 +4047,9 @@ { "name": "vif", "start": 4803, - "end": 5382, + "end": 5381, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -4059,9 +4059,9 @@ { "name": "vpr", "start": 5321, - "end": 5612, + "end": 5611, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -4071,21 +4071,21 @@ { "name": "tat_exon1", "start": 5592, - "end": 5811, + "end": 5807, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5731, - "end": 5812, + "end": 5811, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -4095,9 +4095,9 @@ { "name": "vpu", "start": 5823, - "end": 6069, + "end": 6068, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -4107,9 +4107,9 @@ { "name": "env", "start": 5986, - "end": 8527, + "end": 8526, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -4119,9 +4119,9 @@ { "name": "tat_exon2", "start": 8108, - "end": 8204, + "end": 8203, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -4131,9 +4131,9 @@ { "name": "rev_exon2", "start": 8109, - "end": 8385, + "end": 8384, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -4143,9 +4143,9 @@ { "name": "nef", "start": 8528, - "end": 9143, + "end": 9142, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -4157,9 +4157,9 @@ { "name": "gag", "start": 246, - "end": 1782, + "end": 1781, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.35613851839948674, "protein": "MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ", @@ -4169,9 +4169,9 @@ { "name": "pol", "start": 1544, - "end": 4586, + "end": 4585, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.24526399193257942, "protein": "FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4181,9 +4181,9 @@ { "name": "vif", "start": 4530, - "end": 5109, + "end": 5108, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -4193,9 +4193,9 @@ { "name": "vpr", "start": 5048, - "end": 5339, + "end": 5338, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS", @@ -4205,21 +4205,21 @@ { "name": "tat_exon1", "start": 5319, - "end": 5538, + "end": 5534, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.5237430167597767, "protein": "MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ", - "aminoacids": "MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ*", - "nucleotides": "ATGGATCCAGTAGATCCTAACCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTAACAATTGCTATTGTAAAAAGTGTTGCCTTCATTGCCAAGTTTGTTTCACACGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAGTAA" + "aminoacids": "MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ", + "nucleotides": "ATGGATCCAGTAGATCCTAACCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTAACAATTGCTATTGTAAAAAGTGTTGCCTTCATTGCCAAGTTTGTTTCACACGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5458, - "end": 5539, + "end": 5538, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.5622384937238494, "protein": "MAGRSGDGDEDLLKAVRLIKTLYQSSK", @@ -4229,9 +4229,9 @@ { "name": "vpu", "start": 5550, - "end": 5808, + "end": 5807, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.6039004707464695, "protein": "MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND", @@ -4241,9 +4241,9 @@ { "name": "env", "start": 5716, - "end": 8257, + "end": 8256, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5196110433453024, "protein": "MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE", @@ -4253,9 +4253,9 @@ { "name": "tat_exon2", "start": 7874, - "end": 7970, + "end": 7969, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPASQSRGDPTGPKEPKKKVERETETDPTD", @@ -4265,9 +4265,9 @@ { "name": "rev_exon2", "start": 7875, - "end": 8151, + "end": 8150, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.3471418653089562, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE", @@ -4277,9 +4277,9 @@ { "name": "nef", "start": 8275, - "end": 8896, + "end": 8895, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4680383864671438, "protein": "MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC", @@ -4291,9 +4291,9 @@ { "name": "gag", "start": 2, - "end": 1697, + "end": 1696, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.7478034493979825, "protein": "MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC", @@ -4303,9 +4303,9 @@ { "name": "pol", "start": 1489, - "end": 4501, + "end": 4500, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.7624366800883231, "protein": "KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK", @@ -4315,9 +4315,9 @@ { "name": "vif", "start": 4445, - "end": 5024, + "end": 5023, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7494633160752622, "protein": "MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR", @@ -4327,9 +4327,9 @@ { "name": "vpr", "start": 4963, - "end": 5254, + "end": 5253, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.4464285714285715, "protein": "MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS", @@ -4339,9 +4339,9 @@ { "name": "tat_exon1", "start": 5111, - "end": 5453, + "end": 5452, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.6409453748630458, "protein": "MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ", @@ -4351,21 +4351,21 @@ { "name": "rev_exon1", "start": 5373, - "end": 5454, + "end": 5450, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.5290287574606619, - "protein": "MAGRSGDSDEELLTAVRIIKRLYQSSK", - "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG" + "distance": 0.4886988393402566, + "protein": "MAGRSGDSDEELLTAVRIIKRLYQSS", + "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT" }, { "name": "vpu", "start": 5465, - "end": 5711, + "end": 5710, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7521692502681095, "protein": "MHALEIAAIVRLVVAAIIAIVV", @@ -4375,9 +4375,9 @@ { "name": "env", "start": 5628, - "end": 8229, + "end": 8228, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.7513561129398668, "protein": "MTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD", @@ -4387,9 +4387,9 @@ { "name": "nef", "start": 7624, - "end": 8872, + "end": 8871, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5833488893037148, "protein": "MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC", @@ -4399,9 +4399,9 @@ { "name": "tat_exon2", "start": 7810, - "end": 7903, + "end": 7902, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.5303030303030303, "protein": "RPSSQPRGDPTGPKEQKKEVERKTEAHPRD", @@ -4411,9 +4411,9 @@ { "name": "rev_exon2", "start": 7811, - "end": 8087, + "end": 8086, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.6667847862036381, "protein": "ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE", @@ -4425,9 +4425,9 @@ { "name": "gag", "start": 549, - "end": 2049, + "end": 2048, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -4437,9 +4437,9 @@ { "name": "pol", "start": 1841, - "end": 4853, + "end": 4852, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4449,9 +4449,9 @@ { "name": "vif", "start": 4797, - "end": 5376, + "end": 5375, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.378905844492889, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -4461,9 +4461,9 @@ { "name": "vpr", "start": 5315, - "end": 5606, + "end": 5605, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -4473,21 +4473,21 @@ { "name": "tat_exon1", "start": 5586, - "end": 5805, + "end": 5801, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5725, - "end": 5806, + "end": 5805, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -4497,9 +4497,9 @@ { "name": "vpu", "start": 5817, - "end": 6063, + "end": 6062, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -4509,9 +4509,9 @@ { "name": "env", "start": 5980, - "end": 8521, + "end": 8520, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.46021436825118545, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -4521,9 +4521,9 @@ { "name": "tat_exon2", "start": 8102, - "end": 8198, + "end": 8197, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -4533,9 +4533,9 @@ { "name": "rev_exon2", "start": 8103, - "end": 8379, + "end": 8378, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -4545,9 +4545,9 @@ { "name": "nef", "start": 8522, - "end": 9137, + "end": 9136, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -4559,9 +4559,9 @@ { "name": "gag", "start": 468, - "end": 1968, + "end": 1967, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -4571,9 +4571,9 @@ { "name": "pol", "start": 1760, - "end": 4772, + "end": 4771, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4583,9 +4583,9 @@ { "name": "vif", "start": 4716, - "end": 5295, + "end": 5294, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -4595,9 +4595,9 @@ { "name": "vpr", "start": 5234, - "end": 5525, + "end": 5524, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -4607,21 +4607,21 @@ { "name": "tat_exon1", "start": 5505, - "end": 5724, + "end": 5720, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5644, - "end": 5725, + "end": 5724, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -4631,9 +4631,9 @@ { "name": "vpu", "start": 5736, - "end": 5982, + "end": 5981, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -4643,9 +4643,9 @@ { "name": "env", "start": 5899, - "end": 8440, + "end": 8439, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4583799776107468, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -4655,9 +4655,9 @@ { "name": "tat_exon2", "start": 8021, - "end": 8117, + "end": 8116, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -4667,9 +4667,9 @@ { "name": "rev_exon2", "start": 8022, - "end": 8298, + "end": 8297, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -4679,9 +4679,9 @@ { "name": "nef", "start": 8441, - "end": 9056, + "end": 9055, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -4693,9 +4693,9 @@ { "name": "gag", "start": 825, - "end": 2361, + "end": 2360, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.2559303794507086, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ", @@ -4705,9 +4705,9 @@ { "name": "pol", "start": 2147, - "end": 5165, + "end": 5164, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19193360134872262, "protein": "FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4717,9 +4717,9 @@ { "name": "vif", "start": 5109, - "end": 5688, + "end": 5687, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.24677296886864086, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -4729,9 +4729,9 @@ { "name": "vpr", "start": 5627, - "end": 5918, + "end": 5917, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.2608047690014903, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", @@ -4741,21 +4741,21 @@ { "name": "tat_exon1", "start": 5898, - "end": 6117, + "end": 6113, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.40192926045016075, "protein": "MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGGCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCACTTGTTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGGCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCACTTGTTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAG" }, { "name": "rev_exon1", "start": 6037, - "end": 6118, + "end": 6117, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDDELLKTVRLIKVLYQSSK", @@ -4765,9 +4765,9 @@ { "name": "vpu", "start": 6129, - "end": 6375, + "end": 6374, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5077548005908421, "protein": "MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL", @@ -4777,9 +4777,9 @@ { "name": "env", "start": 6292, - "end": 8875, + "end": 8874, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.48559709145147756, "protein": "MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL", @@ -4789,9 +4789,9 @@ { "name": "tat_exon2", "start": 8456, - "end": 8552, + "end": 8551, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.5303030303030303, "protein": "RSTPQLRGDPTGPKESKEKVERETETDPVH", @@ -4801,9 +4801,9 @@ { "name": "rev_exon2", "start": 8457, - "end": 8733, + "end": 8732, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.3690449563855961, "protein": "DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE", @@ -4813,9 +4813,9 @@ { "name": "nef", "start": 8876, - "end": 9509, + "end": 9508, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.411658382286489, "protein": "MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC", @@ -4827,9 +4827,9 @@ { "name": "gag", "start": 801, - "end": 2313, + "end": 2312, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.23466145196773402, "protein": "MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ", @@ -4839,9 +4839,9 @@ { "name": "pol", "start": 2105, - "end": 5117, + "end": 5116, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.15051124744376299, "protein": "FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4851,9 +4851,9 @@ { "name": "vif", "start": 5061, - "end": 5640, + "end": 5639, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3120665742024965, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -4863,9 +4863,9 @@ { "name": "vpr", "start": 5579, - "end": 5870, + "end": 5869, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.34013605442176864, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAITRILQQLLFIHFRIGCQHSRIGIIQRRRARNGTSRS", @@ -4875,21 +4875,21 @@ { "name": "tat_exon1", "start": 5850, - "end": 6069, + "end": 6065, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.2515090543259557, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ*", - "nucleotides": "ATGGAACCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ", + "nucleotides": "ATGGAACCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5989, - "end": 6070, + "end": 6069, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.27969018932874357, "protein": "MAGRSGDSDEELIKTVRLIKLLYQSSK", @@ -4899,9 +4899,9 @@ { "name": "vpu", "start": 6081, - "end": 6330, + "end": 6329, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.4674390731122653, "protein": "MQPLEISAIVALVVAIIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL", @@ -4911,9 +4911,9 @@ { "name": "env", "start": 6244, - "end": 8827, + "end": 8826, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4447986679391638, "protein": "MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFYASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNTTSTKNTTPSTTASSGERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKKFNGSGPCTNVSTIQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKTIIVHLKDSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSSWKDESNGTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLITRDGGKNNESNTTEIFRPEGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKTLEQIWDNMTWMQWEREIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHPPAPRGPDRPEGIGEEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLNIPRRIRQGLERALL", @@ -4923,9 +4923,9 @@ { "name": "tat_exon2", "start": 8408, - "end": 8504, + "end": 8503, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4971219256933542, "protein": "RPTPQPRGDPTGQKESEKKVERETETDPDH", @@ -4935,9 +4935,9 @@ { "name": "rev_exon2", "start": 8409, - "end": 8685, + "end": 8684, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.3471418653089562, "protein": "DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE", @@ -4947,9 +4947,9 @@ { "name": "nef", "start": 8828, - "end": 9461, + "end": 9460, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.3499750374438344, "protein": "MGGKWSKSSVVGWPAIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC", @@ -4961,9 +4961,9 @@ { "name": "gag", "start": 855, - "end": 2358, + "end": 2357, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.24608716590416602, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQQIDVKDTKEALDKIEEEQNKSKKKVQQAATDTGNNSQASQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGAIMMQRGNFRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEETTTPSQKQEPIDKELYPLASLRSLFGNDPSSQ", @@ -4973,9 +4973,9 @@ { "name": "pol", "start": 2150, - "end": 5162, + "end": 5161, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.1574036511156186, "protein": "FFREDLAFPQGEAREFSSEQTRANSPTSRELQVRGGDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCRLLKGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4985,9 +4985,9 @@ { "name": "vif", "start": 5106, - "end": 5685, + "end": 5684, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.34607778510217535, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWIYKHHYDSINPKISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADRLIHLYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALTALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -4997,9 +4997,9 @@ { "name": "vpr", "start": 5624, - "end": 5915, + "end": 5914, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.2936340145642471, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGILQRRRARNGASRS", @@ -5009,21 +5009,21 @@ { "name": "tat_exon1", "start": 5895, - "end": 6114, + "end": 6110, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.2515090543259557, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGATTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCTCTTGTTATTGTAAGCAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCATCAAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 6034, - "end": 6115, + "end": 6114, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.27969018932874357, "protein": "MAGRSGDSDEELIKTVRLIKLLYQSSK", @@ -5033,9 +5033,9 @@ { "name": "vpu", "start": 6126, - "end": 6375, + "end": 6374, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.4993502877297198, "protein": "MQPLVISAIVALVVVAIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL", @@ -5045,9 +5045,9 @@ { "name": "env", "start": 6289, - "end": 8881, + "end": 8880, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4503018671784417, "protein": "MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTGANNTTSTNTTTPSTTVSSEERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNTSYRLISCNTSVITQACPKVTFEPIPIHYCAPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKNIIVHLNKSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLEQVFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSYWKGEGSNNDTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLLTRDGGNESETTDTETFRPVGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKNLTQIWDNMTWMQWEKEIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL", @@ -5057,9 +5057,9 @@ { "name": "tat_exon2", "start": 8462, - "end": 8558, + "end": 8557, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4542873367404884, "protein": "RPTSQPRGDPTGQKESKEKVERETETDPDH", @@ -5069,9 +5069,9 @@ { "name": "rev_exon2", "start": 8463, - "end": 8739, + "end": 8738, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.3471418653089562, "protein": "DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE", @@ -5081,9 +5081,9 @@ { "name": "nef", "start": 8882, - "end": 9515, + "end": 9514, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.3499750374438344, "protein": "MGGKWSKSSVVGWPKIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC", @@ -5095,9 +5095,9 @@ { "name": "gag", "start": 767, - "end": 2270, + "end": 2269, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.316486214000789, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ", @@ -5107,9 +5107,9 @@ { "name": "pol", "start": 2062, - "end": 5074, + "end": 5073, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.1943357603710517, "protein": "FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -5119,9 +5119,9 @@ { "name": "vif", "start": 5018, - "end": 5597, + "end": 5596, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH", @@ -5131,9 +5131,9 @@ { "name": "vpr", "start": 5536, - "end": 5827, + "end": 5826, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.2608047690014903, "protein": "MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS", @@ -5143,9 +5143,9 @@ { "name": "tat_exon1", "start": 5807, - "end": 6026, + "end": 6025, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.37688442211055273, "protein": "MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ", @@ -5155,21 +5155,21 @@ { "name": "rev_exon1", "start": 5946, - "end": 6027, + "end": 6023, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKFLYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKFLYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKFLYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKFLYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGT" }, { "name": "vpu", "start": 6038, - "end": 6284, + "end": 6283, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5464940306036659, "protein": "MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL", @@ -5179,9 +5179,9 @@ { "name": "env", "start": 6201, - "end": 8778, + "end": 8777, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5083167934238491, "protein": "MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL", @@ -5191,9 +5191,9 @@ { "name": "tat_exon2", "start": 8359, - "end": 8455, + "end": 8454, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4034761018001243, "protein": "RPASQPRGDPTGPKEPTKKVERETETDPDH", @@ -5203,9 +5203,9 @@ { "name": "rev_exon2", "start": 8360, - "end": 8636, + "end": 8635, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE", @@ -5215,9 +5215,9 @@ { "name": "nef", "start": 8779, - "end": 9406, + "end": 9405, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5049429657794677, "protein": "MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC", @@ -5229,9 +5229,9 @@ { "name": "gag", "start": 773, - "end": 2276, + "end": 2275, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.22891685660489547, "protein": "MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ", @@ -5241,9 +5241,9 @@ { "name": "pol", "start": 2068, - "end": 5080, + "end": 5079, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.1363825363825364, "protein": "FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -5253,9 +5253,9 @@ { "name": "vif", "start": 5024, - "end": 5603, + "end": 5602, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.27432333577176293, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -5265,9 +5265,9 @@ { "name": "vpr", "start": 5542, - "end": 5833, + "end": 5832, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.2678354029705382, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGIIQRRRARNGASRS", @@ -5277,9 +5277,9 @@ { "name": "tat_exon1", "start": 5813, - "end": 6032, + "end": 6031, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.31992687385740404, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAPPDSQTHQASLSKQ", @@ -5289,21 +5289,21 @@ { "name": "rev_exon1", "start": 5952, - "end": 6033, + "end": 6029, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.3620426829268293, - "protein": "MAGRSGDSDEELLQTVRLIKLLYQSSK", - "aminoacids": "MAGRSGDSDEELLQTVRLIKLLYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCCAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAG" + "distance": 0.2712477396021701, + "protein": "MAGRSGDSDEELLQTVRLIKLLYQSS", + "aminoacids": "MAGRSGDSDEELLQTVRLIKLLYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCCAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 6044, - "end": 6290, + "end": 6289, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.47888975762314323, "protein": "MQPLHIAAIVALVVAIIIAIVVWSIVFIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVEMGHCAPWDVNDL", @@ -5313,9 +5313,9 @@ { "name": "env", "start": 6207, - "end": 8790, + "end": 8789, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.42511905011642803, "protein": "MRVRGIKKNYQHLWRWGIVLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNNTTSTNDTTSTTTSSGEKMKEGEIKNCSFNITTSIRDKVQKEYALFYKPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGSCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSENFSDNAKTIIVHLNESVEITCIRPNNNTRKSIPIGPGRAFYATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNKTIIFTHSSGGDPEVVTHNFNCGGEFFYCNTTKLFNSTWNETSYWKDERSNDNDTITLPCRIKQIINLWQEVGKAMYAPPIRGYIKCSSNITGLLITRDGGKNESNTTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWDNMTWMEWEREIDNYTSLIYTLIEKSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSGPLVNGFLTIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL", @@ -5325,9 +5325,9 @@ { "name": "tat_exon2", "start": 8371, - "end": 8467, + "end": 8466, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4034761018001243, "protein": "RPTSQPRGDPTGQKESKKKVERETETDPDH", @@ -5337,9 +5337,9 @@ { "name": "rev_exon2", "start": 8372, - "end": 8648, + "end": 8647, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.29843322556577967, "protein": "DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILNNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGTPQILVESPAVLESGTKE", @@ -5349,9 +5349,9 @@ { "name": "nef", "start": 8791, - "end": 9412, + "end": 9411, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.3303271812080537, "protein": "MGGKWSKSSVVGWPAIRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEDEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIHSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC", @@ -5363,9 +5363,9 @@ { "name": "gag", "start": 808, - "end": 2308, + "end": 2307, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.2880084183556755, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ", @@ -5375,9 +5375,9 @@ { "name": "pol", "start": 2100, - "end": 5112, + "end": 5111, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.1880239208210378, "protein": "FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -5387,9 +5387,9 @@ { "name": "vif", "start": 5056, - "end": 5635, + "end": 5634, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.41532297468972923, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH", @@ -5399,9 +5399,9 @@ { "name": "vpr", "start": 5574, - "end": 5865, + "end": 5864, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3120665742024965, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS", @@ -5411,9 +5411,9 @@ { "name": "tat_exon1", "start": 5845, - "end": 6064, + "end": 6063, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ", @@ -5423,9 +5423,9 @@ { "name": "rev_exon1", "start": 5984, - "end": 6065, + "end": 6064, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEDLLKTVRLIKQLYQSSK", @@ -5435,9 +5435,9 @@ { "name": "vpu", "start": 6076, - "end": 6340, + "end": 6339, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.4955621301775147, "protein": "MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL", @@ -5447,9 +5447,9 @@ { "name": "env", "start": 6239, - "end": 8807, + "end": 8806, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4703403690377699, "protein": "MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL", @@ -5459,9 +5459,9 @@ { "name": "tat_exon2", "start": 8388, - "end": 8484, + "end": 8483, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPASQLRGDQTGPKEQKKKVERETETDPGN", @@ -5471,9 +5471,9 @@ { "name": "rev_exon2", "start": 8389, - "end": 8674, + "end": 8673, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.4123815285339786, "protein": "DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC", @@ -5483,9 +5483,9 @@ { "name": "nef", "start": 8808, - "end": 9417, + "end": 9416, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.484764542936288, "protein": "MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC", diff --git a/tests/expected-results-large/errors.json b/tests/expected-results-large/errors.json index 70d4d31..eae4896 100644 --- a/tests/expected-results-large/errors.json +++ b/tests/expected-results-large/errors.json @@ -3,52 +3,52 @@ { "sequence_name": "KX505501.1", "error": "DeletionInOrf", - "message": "ORF pol at 2084-5096 can have maximum deletions 30, got 2721" + "message": "ORF pol at 2084-5095 can have maximum deletions 30, got 2721" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6322" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6322" }, { "sequence_name": "KX505501.1", "error": "InsertionInOrf", - "message": "Smaller ORF vif at 5040-5619 can have maximum insertions 90, got 909" + "message": "Smaller ORF vif at 5040-5618 can have maximum insertions 90, got 909" }, { "sequence_name": "KX505501.1", "error": "DeletionInOrf", - "message": "Smaller ORF vpr at 5558-5849 can have maximum deletions 30, got 66" + "message": "Smaller ORF vpr at 5558-5848 can have maximum deletions 30, got 66" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892" + "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5892" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6046 contains an internal stop codon at 6004" + "message": "Smaller ORF rev_exon1 at 5968-6045 contains an internal stop codon at 6004" }, { "sequence_name": "KX505501.1", "error": "FrameshiftInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains out of frame indels that impact 189 positions." + "message": "Smaller ORF vpu at 6060-6308 contains out of frame indels that impact 190 positions." }, { "sequence_name": "KX505501.1", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 51 positions." + "message": "Smaller ORF tat_exon2 at 8375-8470 contains out of frame indels that impact 51 positions." }, { "sequence_name": "KX505501.1", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 96" + "message": "Smaller ORF rev_exon2 at 8376-8651 can have maximum deletions 30, got 96" }, { "sequence_name": "KX505501.1", "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 867" + "message": "Smaller ORF nef at 8795-9415 can have maximum insertions 90, got 867" }, { "sequence_name": "KX505501.1", @@ -70,59 +70,59 @@ { "sequence_name": "MN691959", "error": "InternalStopInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6123" + "message": "Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6123" }, { "sequence_name": "MN691959", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" + "message": "Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420" } ], "MN692074": [ { "sequence_name": "MN692074", "error": "DeletionInOrf", - "message": "ORF pol at 2084-5096 can have maximum deletions 30, got 981" + "message": "ORF pol at 2084-5095 can have maximum deletions 30, got 981" }, { "sequence_name": "MN692074", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6550" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6550" }, { "sequence_name": "MN692074", "error": "DeletionInOrf", - "message": "Smaller ORF vif at 5040-5619 can have maximum deletions 30, got 81" + "message": "Smaller ORF vif at 5040-5618 can have maximum deletions 30, got 81" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF vpr at 5558-5849 can have maximum insertions 90, got 207" + "message": "Smaller ORF vpr at 5558-5848 can have maximum insertions 90, got 207" }, { "sequence_name": "MN692074", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892" + "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5892" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF vpu at 6060-6309 can have maximum insertions 90, got 249" + "message": "Smaller ORF vpu at 6060-6308 can have maximum insertions 90, got 249" }, { "sequence_name": "MN692074", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 40 positions." + "message": "Smaller ORF tat_exon2 at 8375-8470 contains out of frame indels that impact 40 positions." }, { "sequence_name": "MN692074", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 204" + "message": "Smaller ORF rev_exon2 at 8376-8651 can have maximum deletions 30, got 204" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 882" + "message": "Smaller ORF nef at 8795-9415 can have maximum insertions 90, got 882" }, { "sequence_name": "MN692074", @@ -140,12 +140,12 @@ { "sequence_name": "MN090335", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 822" + "message": "ORF gag at 789-2291 contains an internal stop codon at 822" }, { "sequence_name": "MN090335", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" + "message": "Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420" }, { "sequence_name": "MN090335", @@ -172,7 +172,7 @@ { "sequence_name": "MN090376", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 822" + "message": "ORF gag at 789-2291 contains an internal stop codon at 822" }, { "sequence_name": "MN090376", @@ -256,7 +256,7 @@ { "sequence_name": "MK115211.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6889" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6889" }, { "sequence_name": "MK115211.1", @@ -295,59 +295,59 @@ { "sequence_name": "MK114705.1", "error": "DeletionInOrf", - "message": "Smaller ORF nef at 8795-9416 can have maximum deletions 30, got 186" + "message": "Smaller ORF nef at 8795-9415 can have maximum deletions 30, got 186" } ], "MK114856.1": [ { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 873" + "message": "ORF gag at 789-2291 contains an internal stop codon at 873" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "ORF pol at 2084-5096 contains an internal stop codon at 2213" + "message": "ORF pol at 2084-5095 contains an internal stop codon at 2213" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6325" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6325" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vif at 5040-5619 contains an internal stop codon at 5172" + "message": "Smaller ORF vif at 5040-5618 contains an internal stop codon at 5172" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vpr at 5558-5849 contains an internal stop codon at 5594" + "message": "Smaller ORF vpr at 5558-5848 contains an internal stop codon at 5594" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5919" + "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5919" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126" + "message": "Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6126" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" + "message": "Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433" + "message": "Smaller ORF rev_exon2 at 8376-8651 contains an internal stop codon at 8433" }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", - "message": "Smaller ORF nef at 8795-9416 contains an internal stop codon at 8852" + "message": "Smaller ORF nef at 8795-9415 contains an internal stop codon at 8852" }, { "sequence_name": "MK114856.1", @@ -359,42 +359,42 @@ { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 834" + "message": "ORF gag at 789-2291 contains an internal stop codon at 834" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "ORF pol at 2084-5096 contains an internal stop codon at 2183" + "message": "ORF pol at 2084-5095 contains an internal stop codon at 2183" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6349" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6349" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vif at 5040-5619 contains an internal stop codon at 5373" + "message": "Smaller ORF vif at 5040-5618 contains an internal stop codon at 5373" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vpr at 5558-5849 contains an internal stop codon at 5717" + "message": "Smaller ORF vpr at 5558-5848 contains an internal stop codon at 5717" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5859" + "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5859" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433" + "message": "Smaller ORF rev_exon2 at 8376-8651 contains an internal stop codon at 8433" }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", - "message": "Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873" + "message": "Smaller ORF nef at 8795-9415 contains an internal stop codon at 8873" }, { "sequence_name": "MK115009.1", @@ -416,7 +416,7 @@ { "sequence_name": "MK115387.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" + "message": "Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420" } ], "MK115491.1": [], @@ -424,7 +424,7 @@ { "sequence_name": "MK116110.1", "error": "InternalStopInOrf", - "message": "ORF gag at 140-1643 contains an internal stop codon at 185" + "message": "ORF gag at 140-1642 contains an internal stop codon at 185" }, { "sequence_name": "MK116110.1", @@ -442,7 +442,7 @@ { "sequence_name": "MK114997.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6511" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6511" } ], "MK115518.1": [], @@ -472,47 +472,47 @@ { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 924" + "message": "ORF gag at 789-2291 contains an internal stop codon at 924" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "ORF pol at 2084-5096 contains an internal stop codon at 2183" + "message": "ORF pol at 2084-5095 contains an internal stop codon at 2183" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6424" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6424" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vif at 5040-5619 contains an internal stop codon at 5247" + "message": "Smaller ORF vif at 5040-5618 contains an internal stop codon at 5247" }, { "sequence_name": "MK115464.1", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains out of frame indels that impact 104 positions." + "message": "Smaller ORF tat_exon1 at 5829-6044 contains out of frame indels that impact 104 positions." }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126" + "message": "Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6126" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" + "message": "Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433" + "message": "Smaller ORF rev_exon2 at 8376-8651 contains an internal stop codon at 8433" }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", - "message": "Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873" + "message": "Smaller ORF nef at 8795-9415 contains an internal stop codon at 8873" }, { "sequence_name": "MK115464.1", @@ -525,7 +525,7 @@ { "sequence_name": "MK115520.1", "error": "InternalStopInOrf", - "message": "ORF pol at 2084-5096 contains an internal stop codon at 2198" + "message": "ORF pol at 2084-5095 contains an internal stop codon at 2198" }, { "sequence_name": "MK115520.1", @@ -578,42 +578,42 @@ { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 927" + "message": "ORF gag at 789-2291 contains an internal stop codon at 927" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "ORF pol at 2084-5096 contains an internal stop codon at 2183" + "message": "ORF pol at 2084-5095 contains an internal stop codon at 2183" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6550" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6550" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vif at 5040-5619 contains an internal stop codon at 5151" + "message": "Smaller ORF vif at 5040-5618 contains an internal stop codon at 5151" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5859" + "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5859" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6126" + "message": "Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6126" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 contains an internal stop codon at 8433" + "message": "Smaller ORF rev_exon2 at 8376-8651 contains an internal stop codon at 8433" }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", - "message": "Smaller ORF nef at 8795-9416 contains an internal stop codon at 8873" + "message": "Smaller ORF nef at 8795-9415 contains an internal stop codon at 8873" }, { "sequence_name": "MK115095.1", diff --git a/tests/expected-results-large/holistic.json b/tests/expected-results-large/holistic.json index f1d654f..6e9005c 100644 --- a/tests/expected-results-large/holistic.json +++ b/tests/expected-results-large/holistic.json @@ -6,9 +6,9 @@ "blast_matched_qlen": 1997, "blast_sseq_coverage": 0.2498456472525211, "blast_qseq_coverage": 1.2158237356034052, - "blast_sseq_orfs_coverage": 0.17663960024984385, + "blast_sseq_orfs_coverage": 0.17666166916541728, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 4 }, "MN691959": { @@ -20,7 +20,7 @@ "blast_qseq_coverage": 1.1086063415148004, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MN692074": { @@ -30,9 +30,9 @@ "blast_matched_qlen": 4178, "blast_sseq_coverage": 0.5042189750977567, "blast_qseq_coverage": 1.1728099569171853, - "blast_sseq_orfs_coverage": 0.4114928169893816, + "blast_sseq_orfs_coverage": 0.411544227886057, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 4 }, "MN692145": { @@ -44,7 +44,7 @@ "blast_qseq_coverage": 1.1271545051088863, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MN090335": { @@ -54,9 +54,9 @@ "blast_matched_qlen": 9069, "blast_sseq_coverage": 0.9842560197571517, "blast_qseq_coverage": 1.0603153600176425, - "blast_sseq_orfs_coverage": 1.0003747657713928, + "blast_sseq_orfs_coverage": 1.000374812593703, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MN090376": { @@ -66,9 +66,9 @@ "blast_matched_qlen": 8985, "blast_sseq_coverage": 0.9784935171846059, "blast_qseq_coverage": 1.0604340567612687, - "blast_sseq_orfs_coverage": 0.9943785134291068, + "blast_sseq_orfs_coverage": 0.9943778110944528, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115581.1": { @@ -80,7 +80,7 @@ "blast_qseq_coverage": 1.0046340179041602, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115690.1": { @@ -92,7 +92,7 @@ "blast_qseq_coverage": 1.0113530808132933, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115571.1": { @@ -104,7 +104,7 @@ "blast_qseq_coverage": 1.0113902490951672, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115514.1": { @@ -116,7 +116,7 @@ "blast_qseq_coverage": 1.0173736943082499, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115488.1": { @@ -128,7 +128,7 @@ "blast_qseq_coverage": 1.0325262392185388, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 6 }, "MK115030.1": { @@ -140,7 +140,7 @@ "blast_qseq_coverage": 1.0655270655270654, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115498.1": { @@ -152,7 +152,7 @@ "blast_qseq_coverage": 1.0080329774865235, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115211.1": { @@ -164,7 +164,7 @@ "blast_qseq_coverage": 1.0598981399468557, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115158.1": { @@ -176,7 +176,7 @@ "blast_qseq_coverage": 0.9699223449633599, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 234, - "orfs_end": 8212, + "orfs_end": 8211, "blast_n_conseqs": 1 }, "MK114705.1": { @@ -188,7 +188,7 @@ "blast_qseq_coverage": 1.122622463075125, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 6 }, "MK114856.1": { @@ -200,7 +200,7 @@ "blast_qseq_coverage": 1.0812493405085997, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 4 }, "MK115009.1": { @@ -212,7 +212,7 @@ "blast_qseq_coverage": 1.0590854784403172, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115387.1": { @@ -224,7 +224,7 @@ "blast_qseq_coverage": 1.040936952714536, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115491.1": { @@ -236,7 +236,7 @@ "blast_qseq_coverage": 1.0299299511780937, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK116110.1": { @@ -246,9 +246,9 @@ "blast_matched_qlen": 8967, "blast_sseq_coverage": 0.9957759004001778, "blast_qseq_coverage": 0.9972119995539199, - "blast_sseq_orfs_coverage": 0.998622244488978, + "blast_sseq_orfs_coverage": 0.9986220719027934, "orfs_start": 140, - "orfs_end": 8124, + "orfs_end": 8123, "blast_n_conseqs": 3 }, "MK115527.1": { @@ -260,7 +260,7 @@ "blast_qseq_coverage": 1.0056956017297753, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK114997.1": { @@ -272,7 +272,7 @@ "blast_qseq_coverage": 1.0516841524019878, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115518.1": { @@ -284,7 +284,7 @@ "blast_qseq_coverage": 0.9996854356715948, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115065.1": { @@ -296,7 +296,7 @@ "blast_qseq_coverage": 1.069459518124593, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 6 }, "MK115464.1": { @@ -308,7 +308,7 @@ "blast_qseq_coverage": 0.9893407844354756, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115530.1": { @@ -320,7 +320,7 @@ "blast_qseq_coverage": 0.9992665549036044, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115520.1": { @@ -330,9 +330,9 @@ "blast_matched_qlen": 9589, "blast_sseq_coverage": 0.9786993208479111, "blast_qseq_coverage": 0.987902805297737, - "blast_sseq_orfs_coverage": 1.0121174266083697, + "blast_sseq_orfs_coverage": 1.012118940529735, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115503.1": { @@ -344,7 +344,7 @@ "blast_qseq_coverage": 0.9953207861079338, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115570.1": { @@ -356,7 +356,7 @@ "blast_qseq_coverage": 1.0057986294148655, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115509.1": { @@ -368,7 +368,7 @@ "blast_qseq_coverage": 1.0197797498128942, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115702.1": { @@ -378,9 +378,9 @@ "blast_matched_qlen": 9098, "blast_sseq_coverage": 0.9874459765383824, "blast_qseq_coverage": 1.0596834469114091, - "blast_sseq_orfs_coverage": 1.0198625858838226, + "blast_sseq_orfs_coverage": 1.0198650674662668, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 4 }, "MK115095.1": { @@ -392,7 +392,7 @@ "blast_qseq_coverage": 1.060085367188355, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 2 }, "MK115490.1": { @@ -404,7 +404,7 @@ "blast_qseq_coverage": 1.0204343639670483, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MK115576.1": { @@ -416,7 +416,7 @@ "blast_qseq_coverage": 1.0342110943233327, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "OQ092466": { @@ -428,7 +428,7 @@ "blast_qseq_coverage": 1.1192442700805285, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "OQ092463": { @@ -440,7 +440,7 @@ "blast_qseq_coverage": 0.9884435190005205, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 140, - "orfs_end": 8124, + "orfs_end": 8123, "blast_n_conseqs": 2 }, "OQ092465": { @@ -452,7 +452,7 @@ "blast_qseq_coverage": 0.9620043482762191, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 200, - "orfs_end": 8208, + "orfs_end": 8207, "blast_n_conseqs": 2 }, "OQ092462": { @@ -464,7 +464,7 @@ "blast_qseq_coverage": 1.1301214741610048, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "OQ092464": { @@ -476,7 +476,7 @@ "blast_qseq_coverage": 0.9678735872750105, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 200, - "orfs_end": 8208, + "orfs_end": 8207, "blast_n_conseqs": 2 }, "OQ092467": { @@ -488,7 +488,7 @@ "blast_qseq_coverage": 1.0962157809983897, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 } } \ No newline at end of file diff --git a/tests/expected-results-large/orfs.json b/tests/expected-results-large/orfs.json index 9d50b56..3bf4500 100644 --- a/tests/expected-results-large/orfs.json +++ b/tests/expected-results-large/orfs.json @@ -3,9 +3,9 @@ { "name": "env", "start": 0, - "end": 1824, + "end": 1823, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.7623480451210163, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -15,9 +15,9 @@ { "name": "vif", "start": 0, - "end": 1824, + "end": 1823, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7647696476964769, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -27,9 +27,9 @@ { "name": "nef", "start": 0, - "end": 1824, + "end": 1823, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.764345579086969, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -39,9 +39,9 @@ { "name": "tat_exon1", "start": 1, - "end": 1750, + "end": 1749, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.7680130480667754, "protein": "MRKLQNGIDCIQCMQGLLHQAR", @@ -51,9 +51,9 @@ { "name": "gag", "start": 336, - "end": 1824, + "end": 1823, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3997973809613161, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -63,9 +63,9 @@ { "name": "rev_exon1", "start": 1306, - "end": 1750, + "end": 1749, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.758082497212932, "protein": "MRTQIVKLF", @@ -75,9 +75,9 @@ { "name": "vpr", "start": 1599, - "end": 1824, + "end": 1823, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.763687959047407, "protein": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -87,9 +87,9 @@ { "name": "vpu", "start": 1599, - "end": 1824, + "end": 1823, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7672672672672673, "protein": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -99,9 +99,9 @@ { "name": "pol", "start": 1627, - "end": 1927, + "end": 1926, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.7724330674761569, "protein": "GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI", @@ -111,9 +111,9 @@ { "name": "tat_exon2", "start": 1746, - "end": 1824, + "end": 1823, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.7616257781032589, "protein": "RCIRSTTRTADTELFTRDFPLGTFQ", @@ -123,9 +123,9 @@ { "name": "rev_exon2", "start": 1747, - "end": 1927, + "end": 1926, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.7620186257236345, "protein": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI", @@ -137,9 +137,9 @@ { "name": "gag", "start": 639, - "end": 2142, + "end": 2141, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.0801186943620179, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ", @@ -149,9 +149,9 @@ { "name": "pol", "start": 1934, - "end": 4946, + "end": 4945, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.054722889368558514, "protein": "FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -161,9 +161,9 @@ { "name": "vif", "start": 4890, - "end": 5469, + "end": 5468, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.09157509157509158, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -173,9 +173,9 @@ { "name": "vpr", "start": 5408, - "end": 5699, + "end": 5698, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.09157509157509158, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS", @@ -185,21 +185,21 @@ { "name": "tat_exon1", "start": 5679, - "end": 5898, + "end": 5894, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5818, - "end": 5899, + "end": 5898, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEDLLKTVRLIKFLYQSSK", @@ -209,9 +209,9 @@ { "name": "vpu", "start": 5910, - "end": 6156, + "end": 6155, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7333193453629878, "protein": "MQPIQIAIVALVVAIIIAIVV", @@ -221,9 +221,9 @@ { "name": "env", "start": 6070, - "end": 8656, + "end": 8655, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.1405525502318391, "protein": "MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL", @@ -233,9 +233,9 @@ { "name": "tat_exon2", "start": 8237, - "end": 8333, + "end": 8332, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.6672629695885509, "protein": "RPTSQTRGDPTGPKE", @@ -245,9 +245,9 @@ { "name": "rev_exon2", "start": 8238, - "end": 8514, + "end": 8513, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.210025203024363, "protein": "DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE", @@ -257,9 +257,9 @@ { "name": "nef", "start": 8657, - "end": 9278, + "end": 9277, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.06582796957284964, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", @@ -271,9 +271,9 @@ { "name": "nef", "start": 0, - "end": 4059, + "end": 4058, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.7628009106462086, "protein": "MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ", @@ -283,9 +283,9 @@ { "name": "env", "start": 2, - "end": 4115, + "end": 4114, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.76033143808071, "protein": "MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -295,9 +295,9 @@ { "name": "gag", "start": 789, - "end": 2292, + "end": 2291, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.19470123431286457, "protein": "MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ", @@ -307,9 +307,9 @@ { "name": "pol", "start": 2084, - "end": 4115, + "end": 4114, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.5617851221088768, "protein": "FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -319,9 +319,9 @@ { "name": "vif", "start": 3617, - "end": 4115, + "end": 4114, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7631664499349805, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -331,9 +331,9 @@ { "name": "vpr", "start": 3617, - "end": 4115, + "end": 4114, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.7629151983204618, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -343,9 +343,9 @@ { "name": "vpu", "start": 3617, - "end": 4115, + "end": 4114, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7634058115037564, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -355,9 +355,9 @@ { "name": "tat_exon1", "start": 3823, - "end": 4084, + "end": 4083, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.7659115426105717, "protein": "MVPVRERTHSRSRNLLCRWGS", @@ -367,9 +367,9 @@ { "name": "rev_exon1", "start": 3823, - "end": 4084, + "end": 4083, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.7610789980732178, "protein": "MVPVRERTHSRSRNLLCRWGS", @@ -379,9 +379,9 @@ { "name": "tat_exon2", "start": 4080, - "end": 4164, + "end": 4163, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.769292994661058, "protein": "IPSGEPSDAAYKQLLFACTGSLWLDQI", @@ -391,9 +391,9 @@ { "name": "rev_exon2", "start": 4081, - "end": 4153, + "end": 4152, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.7667894365645325, "protein": "YPVASPQMLHISSCFLPVLGLSG", @@ -405,9 +405,9 @@ { "name": "gag", "start": 775, - "end": 2281, + "end": 2280, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.20784453738651432, "protein": "MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ", @@ -417,9 +417,9 @@ { "name": "pol", "start": 2070, - "end": 5085, + "end": 5084, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.14843087362171337, "protein": "FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED", @@ -429,9 +429,9 @@ { "name": "vif", "start": 5029, - "end": 5608, + "end": 5607, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.2608047690014903, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH", @@ -441,9 +441,9 @@ { "name": "vpr", "start": 5547, - "end": 5838, + "end": 5837, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS", @@ -453,9 +453,9 @@ { "name": "tat_exon1", "start": 5818, - "end": 6037, + "end": 6036, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ", @@ -465,9 +465,9 @@ { "name": "rev_exon1", "start": 5957, - "end": 6038, + "end": 6037, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4274965800273598, "protein": "MAGRSGDSDEELLKTVRLIKFLYQSSK", @@ -477,9 +477,9 @@ { "name": "vpu", "start": 6049, - "end": 6298, + "end": 6297, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.520618556701031, "protein": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL", @@ -489,9 +489,9 @@ { "name": "env", "start": 6212, - "end": 8783, + "end": 8782, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4766895145301081, "protein": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL", @@ -501,9 +501,9 @@ { "name": "tat_exon2", "start": 8364, - "end": 8460, + "end": 8459, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.3921568627450981, "protein": "RPASQPRGDPTGPKESKKKVERETETDPLH", @@ -513,9 +513,9 @@ { "name": "rev_exon2", "start": 8365, - "end": 8641, + "end": 8640, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.29843322556577967, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE", @@ -525,9 +525,9 @@ { "name": "nef", "start": 8784, - "end": 9387, + "end": 9386, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.3966849799795139, "protein": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC", @@ -539,9 +539,9 @@ { "name": "gag", "start": 315, - "end": 1665, + "end": 1664, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.596665989022159, "protein": "MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ", @@ -551,9 +551,9 @@ { "name": "pol", "start": 1427, - "end": 4469, + "end": 4468, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.27887169154684477, "protein": "FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -563,9 +563,9 @@ { "name": "vif", "start": 4413, - "end": 4992, + "end": 4991, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH", @@ -575,9 +575,9 @@ { "name": "vpr", "start": 4931, - "end": 5222, + "end": 5221, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3808935556928146, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS", @@ -587,21 +587,21 @@ { "name": "tat_exon1", "start": 5202, - "end": 5421, + "end": 5417, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.40192926045016075, "protein": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", - "aminoacids": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ*", - "nucleotides": "ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAA" + "aminoacids": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", + "nucleotides": "ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAG" }, { "name": "rev_exon1", "start": 5341, - "end": 5422, + "end": 5421, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.524971623155505, "protein": "MAGRSGDRDEDLLKTVRLIKFLYQSSK", @@ -611,9 +611,9 @@ { "name": "vpu", "start": 5433, - "end": 5682, + "end": 5681, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5244381020335356, "protein": "MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL", @@ -623,9 +623,9 @@ { "name": "env", "start": 5596, - "end": 8158, + "end": 8157, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5152420275849952, "protein": "MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ", @@ -635,9 +635,9 @@ { "name": "tat_exon2", "start": 7739, - "end": 7835, + "end": 7834, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.6842105263157894, "protein": "RPSSQPRGDQTGPKE", @@ -647,9 +647,9 @@ { "name": "rev_exon2", "start": 7740, - "end": 8016, + "end": 8015, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.4267425320056898, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE", @@ -659,9 +659,9 @@ { "name": "nef", "start": 8159, - "end": 8813, + "end": 8812, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4891015417331206, "protein": "MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC", @@ -673,9 +673,9 @@ { "name": "gag", "start": 522, - "end": 1590, + "end": 1589, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.6828741441147701, "protein": "MYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP", @@ -685,9 +685,9 @@ { "name": "pol", "start": 1382, - "end": 4394, + "end": 4393, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.23966680468616797, "protein": "FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGEDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQDEHEKYHSNWRAMASDFNIPPVVAKEIVACCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED", @@ -697,9 +697,9 @@ { "name": "vif", "start": 4338, - "end": 4920, + "end": 4919, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.42479043044174425, "protein": "MENRWQVMVVWQVDRMRISMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRKKPPLPSVRKLTEDRWKEPQRTKGHRESHTMNGH", @@ -709,9 +709,9 @@ { "name": "vpr", "start": 4859, - "end": 5150, + "end": 5149, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.36116422349691957, "protein": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS", @@ -721,21 +721,21 @@ { "name": "tat_exon1", "start": 5130, - "end": 5349, + "end": 5345, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.46628407460545196, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAGGACTGCGTGCACCAGTTGCTATTGTAAAAAGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDSRNHQVSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTGGAGCCCTGGAAGCATCCAGGGAGTCAGCCTAGGACTGCGTGCACCAGTTGCTATTGTAAAAAGTGTTGCTATCATTGCCCGCGATGCTTCTTAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAACTCCTCAGGATAGCCGGAACCATCAAGTTTCTTTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5269, - "end": 5350, + "end": 5349, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.5763097949886105, "protein": "MAGRSGDSDEELLRIAGTIKFLYQSSK", @@ -745,9 +745,9 @@ { "name": "vpu", "start": 5361, - "end": 5631, + "end": 5630, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5680096940321115, "protein": "MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLDMGHHAPWDVNDL", @@ -757,9 +757,9 @@ { "name": "env", "start": 5524, - "end": 8110, + "end": 8109, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.49863720871464445, "protein": "MRVKGTKKNWQPSWRWGTMLIWIWATMLLGMSMTCNAEDSWVTVYYGVPVWKEAATTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNINSTNINNTNSIEREMTNCSFNVTTVIRDKVQKQYALFYKLDVVQIKDDNTSYNTSYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCKNVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRRSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIRQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL", @@ -769,9 +769,9 @@ { "name": "tat_exon2", "start": 7691, - "end": 7784, + "end": 7783, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4464285714285715, "protein": "RPSSQPRGDPTGPKESEKKVERETETDPVT", @@ -781,9 +781,9 @@ { "name": "rev_exon2", "start": 7692, - "end": 7968, + "end": 7967, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.4267425320056898, "protein": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE", @@ -793,9 +793,9 @@ { "name": "nef", "start": 8111, - "end": 8735, + "end": 8734, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5036770338593534, "protein": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTSANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC", @@ -807,9 +807,9 @@ { "name": "gag", "start": 680, - "end": 2180, + "end": 2179, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -819,9 +819,9 @@ { "name": "pol", "start": 1972, - "end": 4984, + "end": 4983, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -831,9 +831,9 @@ { "name": "vif", "start": 4928, - "end": 5507, + "end": 5506, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -843,9 +843,9 @@ { "name": "vpr", "start": 5446, - "end": 5737, + "end": 5736, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -855,9 +855,9 @@ { "name": "tat_exon1", "start": 5717, - "end": 5936, + "end": 5935, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -867,21 +867,21 @@ { "name": "rev_exon1", "start": 5856, - "end": 5937, + "end": 5933, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 5948, - "end": 6194, + "end": 6193, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -891,9 +891,9 @@ { "name": "env", "start": 6111, - "end": 8652, + "end": 8651, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -903,9 +903,9 @@ { "name": "tat_exon2", "start": 8233, - "end": 8329, + "end": 8328, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -915,9 +915,9 @@ { "name": "rev_exon2", "start": 8234, - "end": 8510, + "end": 8509, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -927,9 +927,9 @@ { "name": "nef", "start": 8653, - "end": 9268, + "end": 9267, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -941,9 +941,9 @@ { "name": "gag", "start": 777, - "end": 2286, + "end": 2285, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.24076694150363465, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQIMGQLQPALQTGSEELRSLYNTVATLYCVHQRIEVKDTKEALEKVEEEQNKSKKKAQQAAAGAGNSSQTSTSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATNSAAIMMQRGNFRNQRKSVKCFNCGKDGHIAKNCRAPRRKGCWKCGKEGHQMKDCPERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTTPSQKQEKIDQDLYPLASLKSLFGNDPSSQ", @@ -953,9 +953,9 @@ { "name": "pol", "start": 2078, - "end": 5090, + "end": 5089, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.185747174550021, "protein": "FFRENLAFPQGEAREFSSEQTRANSPTRGELQVWGGDNNSLSEAGEDRPGPVSFSFPQITLWQRPLVTIKVGGQLKEALLDTGADDTVLEDMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPYRKQNPNIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIALPEKESWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVIPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQEQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKSGKAGYVTNRGRQKVIPLTDTTNQKTELHAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQEAAYFILKLAGRWPVATIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDVIATDLQTKELQKQITKIQHFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -965,9 +965,9 @@ { "name": "vif", "start": 5034, - "end": 5613, + "end": 5612, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.39766435115272314, "protein": "MENRWQVMIVWQVDRMRIRRWHSLVKHHIYISGKARGWVYKHHYENTHPRISSKVYIPLGEARLAVTTYWGLHTGERDWHLGQGVSIEWRKKEYSTQVDPNLADQLIHLYYFDCFSESAIRNVILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSITKLTEDRWNKPQRTKGHRGNHTMNGH", @@ -977,9 +977,9 @@ { "name": "vpr", "start": 5552, - "end": 5843, + "end": 5842, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.37688442211055273, "protein": "MEQAPENQGPPREPYNEWALELLEELKSEAVRHFPRMWLHGLGQHIYETYGDTWTGVEALIRSLQQLLFIHFRIGCRHSRIGITPQRRTRNGASRS", @@ -989,21 +989,21 @@ { "name": "tat_exon1", "start": 5823, - "end": 6042, + "end": 6038, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.40192926045016075, "protein": "MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ", - "aminoacids": "MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAATCTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCACTTGCTATTGTAAACAGTGTTGCTATCATTGCCAAGTTTGTTTCATAACCAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPNLEPWKHPGSQPKTACTTCYCKQCCYHCQVCFITKGLGISYGRKKRRQRRGSPQDSQIHQASLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAATCTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCACTTGCTATTGTAAACAGTGTTGCTATCATTGCCAAGTTTGTTTCATAACCAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAACGACGAGGATCTCCTCAAGACAGTCAGATTCATCAAGCTTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5962, - "end": 6043, + "end": 6042, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.524971623155505, "protein": "MAGRSGDNDEDLLKTVRFIKLLYQSSK", @@ -1013,9 +1013,9 @@ { "name": "vpu", "start": 6054, - "end": 6300, + "end": 6299, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.48542752364408415, "protein": "MQSLAILAIVALVVAAIIAIVVWTIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDHEELSALMEMGHHAPWDVDDL", @@ -1025,9 +1025,9 @@ { "name": "env", "start": 6217, - "end": 8800, + "end": 8799, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.49751604598034604, "protein": "MRVKGIMKNYQHLWRWGIMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYDTEAHNVWATHACVPTDPNPQEIGLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLHCTKLEINSTKKTNSTNNGTNINATDDSWGEMKNCSFNTTASIRDKVQREFALFYKLDIVPIDNDDINYRLISCNTSVLTQACPKVSFEPIPIHYCAPAGFAILKCRDKNFNGTGQCKNVSTVQCTHGIRPVVSTQLLFNGSLAEEEVVIKSENITDNTKTIIVQLNASVAIVCTRPNNNTRKSIPIGPGRAFYAAGDIIGDIRRAHCILNKTTWDNTIEQVAKKLREQFENKTIVFSESSGGDPEITMISFNCGGEFFYCNSVQLFNSTWHNNGSSTTGSSSSEGNITLPCKIKQIINMWQEVGKAMYAPPIRGPISCESNITGLLLTRDGGNDANGNNTETFRPGGGNMRDNWRSELYRYKVVKIEPLGVAPTRAQRRVVQREKRAVGLGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGLWGCSGKLICNTAVPWNTSWSNKSLDDIWHNMTWMEWEREIDNYTNIIYSLIEASQTQQEKNEQELLELDKWASLWNWFSISNWLWYIKIFIMIVGGLVGLRIVFTILSIVNRVRKGYSPLSFQTHLPAQRGPDRPEGTGDEGGEQDRDRSTHLVDGFLAIIWVDLRNLCLFLYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWRRELKNSAVSLLNATAIAVAEGTDRVIEGLRRAFRAIIHIPRRIRQGLERALQ", @@ -1037,9 +1037,9 @@ { "name": "tat_exon2", "start": 8381, - "end": 8474, + "end": 8473, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPTSQPRGDPTGPKEPETKVESKTETDPLT", @@ -1049,9 +1049,9 @@ { "name": "rev_exon2", "start": 8382, - "end": 8658, + "end": 8657, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.42982806877249113, "protein": "DPPPSPEGTRQARRNRRRRWRARQRQIHSLSGWILSNYLGRPAEPVPLPLPPLERLTLDCSEDCGTSGTQGVGSPQILVEPSAVLEAGTKE", @@ -1061,9 +1061,9 @@ { "name": "nef", "start": 8801, - "end": 9425, + "end": 9424, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.459649710885779, "protein": "MGGKWSKCSIVGWPTVRERIRRAEPAAEGVGAVSRDLEKHGAITSSNANNADCTWLEAQKEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGIIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVEPERVEEENKRENRCLLHPMSQHGMDDPEKEVLQWRFDSRLAFHHVARELHPEYYKN", @@ -1075,9 +1075,9 @@ { "name": "gag", "start": 579, - "end": 2079, + "end": 2078, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -1087,9 +1087,9 @@ { "name": "pol", "start": 1871, - "end": 4883, + "end": 4882, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEAFLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -1099,9 +1099,9 @@ { "name": "vif", "start": 4827, - "end": 5406, + "end": 5405, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.378905844492889, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -1111,9 +1111,9 @@ { "name": "vpr", "start": 5345, - "end": 5636, + "end": 5635, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -1123,21 +1123,21 @@ { "name": "tat_exon1", "start": 5616, - "end": 5835, + "end": 5831, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGCAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5755, - "end": 5836, + "end": 5835, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -1147,9 +1147,9 @@ { "name": "vpu", "start": 5847, - "end": 6093, + "end": 6092, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -1159,9 +1159,9 @@ { "name": "env", "start": 6010, - "end": 8551, + "end": 8550, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4585964351370794, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -1171,9 +1171,9 @@ { "name": "tat_exon2", "start": 8132, - "end": 8228, + "end": 8227, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -1183,9 +1183,9 @@ { "name": "rev_exon2", "start": 8133, - "end": 8409, + "end": 8408, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -1195,9 +1195,9 @@ { "name": "nef", "start": 8552, - "end": 9167, + "end": 9166, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4690990320178705, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -1209,9 +1209,9 @@ { "name": "gag", "start": 584, - "end": 2084, + "end": 2083, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -1221,9 +1221,9 @@ { "name": "pol", "start": 1876, - "end": 4888, + "end": 4887, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19298018391400085, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -1233,9 +1233,9 @@ { "name": "vif", "start": 4832, - "end": 5411, + "end": 5410, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.378905844492889, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -1245,9 +1245,9 @@ { "name": "vpr", "start": 5350, - "end": 5641, + "end": 5640, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -1257,9 +1257,9 @@ { "name": "tat_exon1", "start": 5621, - "end": 5840, + "end": 5839, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -1269,21 +1269,21 @@ { "name": "rev_exon1", "start": 5760, - "end": 5841, + "end": 5837, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 5852, - "end": 6098, + "end": 6097, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -1293,9 +1293,9 @@ { "name": "env", "start": 6015, - "end": 8556, + "end": 8555, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.46021436825118545, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -1305,9 +1305,9 @@ { "name": "tat_exon2", "start": 8137, - "end": 8233, + "end": 8232, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -1317,9 +1317,9 @@ { "name": "rev_exon2", "start": 8138, - "end": 8414, + "end": 8413, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -1329,9 +1329,9 @@ { "name": "nef", "start": 8557, - "end": 9172, + "end": 9171, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4690990320178705, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -1343,9 +1343,9 @@ { "name": "gag", "start": 707, - "end": 2207, + "end": 2206, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -1355,9 +1355,9 @@ { "name": "pol", "start": 1999, - "end": 5011, + "end": 5010, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19298018391400085, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -1367,9 +1367,9 @@ { "name": "vif", "start": 4955, - "end": 5534, + "end": 5533, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.378905844492889, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGDIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -1379,9 +1379,9 @@ { "name": "vpr", "start": 5473, - "end": 5764, + "end": 5763, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -1391,9 +1391,9 @@ { "name": "tat_exon1", "start": 5744, - "end": 5963, + "end": 5962, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -1403,21 +1403,21 @@ { "name": "rev_exon1", "start": 5883, - "end": 5964, + "end": 5960, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 5975, - "end": 6221, + "end": 6220, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -1427,9 +1427,9 @@ { "name": "env", "start": 6138, - "end": 8679, + "end": 8678, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.46021436825118545, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNITNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIVFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -1439,9 +1439,9 @@ { "name": "tat_exon2", "start": 8260, - "end": 8356, + "end": 8355, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -1451,9 +1451,9 @@ { "name": "rev_exon2", "start": 8261, - "end": 8537, + "end": 8536, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -1463,9 +1463,9 @@ { "name": "nef", "start": 8680, - "end": 9295, + "end": 9294, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4690990320178705, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDGEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -1477,9 +1477,9 @@ { "name": "gag", "start": 176, - "end": 1685, + "end": 1684, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.27304152847199525, "protein": "MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRKNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP", @@ -1489,9 +1489,9 @@ { "name": "pol", "start": 1477, - "end": 4489, + "end": 4488, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.26443159013103534, "protein": "FFREDLAFPQGEAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED", @@ -1501,9 +1501,9 @@ { "name": "vif", "start": 4433, - "end": 5012, + "end": 5011, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3903081914030819, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH", @@ -1513,9 +1513,9 @@ { "name": "vpr", "start": 4951, - "end": 5242, + "end": 5241, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEDIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", @@ -1525,9 +1525,9 @@ { "name": "tat_exon1", "start": 5222, - "end": 5441, + "end": 5440, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.48954161103693805, "protein": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", @@ -1537,21 +1537,21 @@ { "name": "rev_exon1", "start": 5361, - "end": 5442, + "end": 5438, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.5290287574606619, - "protein": "MAGRSGDSDEELLTAVRIIKRLYQSSK", - "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG" + "distance": 0.4886988393402566, + "protein": "MAGRSGDSDEELLTAVRIIKRLYQSS", + "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT" }, { "name": "vpu", "start": 5453, - "end": 5699, + "end": 5698, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5682727709300466, "protein": "MHILEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSAIVEMGHLVPWDGDDM", @@ -1561,9 +1561,9 @@ { "name": "env", "start": 5616, - "end": 8217, + "end": 8216, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5091484869809996, "protein": "MKVTGTRRNYQQLWRWGILFLGMVMICSARNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNNTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAMGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWNPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL", @@ -1573,9 +1573,9 @@ { "name": "tat_exon2", "start": 7798, - "end": 7891, + "end": 7890, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD", @@ -1585,9 +1585,9 @@ { "name": "rev_exon2", "start": 7799, - "end": 8075, + "end": 8074, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE", @@ -1597,9 +1597,9 @@ { "name": "nef", "start": 8218, - "end": 8860, + "end": 8859, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5432971135257649, "protein": "MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNTDVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC", @@ -1611,9 +1611,9 @@ { "name": "gag", "start": 663, - "end": 2163, + "end": 2162, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -1623,9 +1623,9 @@ { "name": "pol", "start": 1955, - "end": 4967, + "end": 4966, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -1635,9 +1635,9 @@ { "name": "vif", "start": 4911, - "end": 5490, + "end": 5489, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -1647,9 +1647,9 @@ { "name": "vpr", "start": 5429, - "end": 5720, + "end": 5719, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -1659,21 +1659,21 @@ { "name": "tat_exon1", "start": 5700, - "end": 5919, + "end": 5915, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5839, - "end": 5920, + "end": 5919, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -1683,9 +1683,9 @@ { "name": "vpu", "start": 5931, - "end": 6177, + "end": 6176, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -1695,9 +1695,9 @@ { "name": "env", "start": 6094, - "end": 8635, + "end": 8634, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -1707,9 +1707,9 @@ { "name": "tat_exon2", "start": 8216, - "end": 8312, + "end": 8311, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -1719,9 +1719,9 @@ { "name": "rev_exon2", "start": 8217, - "end": 8493, + "end": 8492, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -1731,9 +1731,9 @@ { "name": "nef", "start": 8636, - "end": 9251, + "end": 9250, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -1745,9 +1745,9 @@ { "name": "gag", "start": 250, - "end": 1753, + "end": 1752, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.25132972351334526, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQKIEIKDTKEALDKIEEEQNKSKKKTQQAAADTGHNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNAVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPLSSLKSLFGNDP", @@ -1757,9 +1757,9 @@ { "name": "pol", "start": 1545, - "end": 4557, + "end": 4556, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.2540106951871657, "protein": "FFRENLAFPQGKARELSSKQDRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPSVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISRIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNLPPVIAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDGCVASRQDED", @@ -1769,9 +1769,9 @@ { "name": "vif", "start": 4501, - "end": 5083, + "end": 5082, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.40472673559822736, "protein": "MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKLTEDRWNEPQRTKGHRESHTMNGH", @@ -1781,9 +1781,9 @@ { "name": "vpr", "start": 5022, - "end": 5313, + "end": 5312, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3808935556928146, "protein": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRTLQQLVFIHFRIGCQHSRIGILTHRRARNGASRS", @@ -1793,9 +1793,9 @@ { "name": "tat_exon1", "start": 5293, - "end": 5512, + "end": 5511, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.4691531785127845, "protein": "MEPVDPRLEPWKHPGSQPKTACTSCYCKRCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ", @@ -1805,9 +1805,9 @@ { "name": "rev_exon1", "start": 5432, - "end": 5513, + "end": 5512, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.564475664826894, "protein": "MAGRSGDSDEELLRITRTIKFLYQNSE", @@ -1817,9 +1817,9 @@ { "name": "vpu", "start": 5524, - "end": 5794, + "end": 5793, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5776066350710902, "protein": "MQSLEILAIVALVVAFIIAIVVWSIVFIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWEVNDL", @@ -1829,9 +1829,9 @@ { "name": "env", "start": 5687, - "end": 8198, + "end": 8197, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.6638103647692366, "protein": "MHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARHLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEVIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL", @@ -1841,9 +1841,9 @@ { "name": "tat_exon2", "start": 7779, - "end": 7872, + "end": 7871, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4464285714285715, "protein": "RPSSQPRGDPTGPKESEKKVERETETDPVT", @@ -1853,9 +1853,9 @@ { "name": "rev_exon2", "start": 7780, - "end": 8056, + "end": 8055, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.4267425320056898, "protein": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGCGTSGTQGVGSPQVLVESPAVLEPGTKE", @@ -1865,9 +1865,9 @@ { "name": "nef", "start": 8199, - "end": 8823, + "end": 8822, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5093153589821267, "protein": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDPDKEVLVWKFDSRLAFRHVAREIHPEYYKNC", @@ -1879,9 +1879,9 @@ { "name": "gag", "start": 316, - "end": 1819, + "end": 1818, "subtype_start": 234, - "subtype_end": 1731, + "subtype_end": 1730, "orientation": "forward", "distance": 0.38499312512276596, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFNTVAVLYCVHQRIEIKDTKEALDKIEEEQNKSKKKTQQAAADPGNSNQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASVMMQKGNFRSQRKMVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRTEPTAPPEESFSFGEKTTTPSQKQEPIDQELYPMSSLKSLFGNDP", @@ -1891,9 +1891,9 @@ { "name": "pol", "start": 1611, - "end": 4623, + "end": 4622, "subtype_start": 1526, - "subtype_end": 4535, + "subtype_end": 4534, "orientation": "forward", "distance": 0.30843043180260443, "protein": "FFRENLAFPQGEARELSSKQNRTNSPTRGELQFWGKDNNSFSEAGADRPGTIPYVFPQITLWQRPLVTVRIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVKQYDQISVEICGHKAIGTVLIGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICKEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDMVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGAKALTEVVPLTEEAELELAENREILKEPVHGVYYDPTKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWESWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKSGKAGYVTDRGRQKVISLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIQKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEDHEKYHSNWRAMASDFNIPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVTTIHTDNGPNFTSNAVKAACWWAGVKQEFGIPYNPQSQGVVESMNKQLKQIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDGCVASRQDED", @@ -1903,9 +1903,9 @@ { "name": "vif", "start": 4567, - "end": 5149, + "end": 5148, "subtype_start": 4479, - "subtype_end": 5061, + "subtype_end": 5060, "orientation": "forward", "distance": 0.48399487836107546, "protein": "MENRWQVMVVWQVDRMRINMWKSLVKYHIHNSGKARGWCYRHHYESRHPRISSEVHIPLGGEARLVVTTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADQLIHLYYFNCFSESAIRQAILGHRVSPRCEYQAGHNKVGSLQYLALIALIPPKRRKPPLPSVRKRTEDRWNEPQRTKGHRESHTMNGH", @@ -1915,9 +1915,9 @@ { "name": "vpr", "start": 5088, - "end": 5379, + "end": 5378, "subtype_start": 5000, - "subtype_end": 5291, + "subtype_end": 5290, "orientation": "forward", "distance": 0.43053960964408733, "protein": "MERAPEDQGPQREPYNEWTLELLEELKREAVRHFPRAWLHGLGQHIYETYGDTWAGVEALIRILQQLVFIHFRIGCQHSRIGILTHRRARNGASRS", @@ -1927,9 +1927,9 @@ { "name": "tat_exon1", "start": 5359, - "end": 5578, + "end": 5577, "subtype_start": 5271, - "subtype_end": 5487, + "subtype_end": 5486, "orientation": "forward", "distance": 0.4464285714285715, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKKCCYHCPRCFLTKGLGISYGRKKRRQRRRTPQDNQNHQVSLSKQ", @@ -1939,9 +1939,9 @@ { "name": "rev_exon1", "start": 5498, - "end": 5579, + "end": 5578, "subtype_start": 5410, - "subtype_end": 5488, + "subtype_end": 5487, "orientation": "forward", "distance": 0.5622384937238494, "protein": "MAGRSGDSDEELLKITRTIKFLYQNSE", @@ -1951,9 +1951,9 @@ { "name": "vpu", "start": 5590, - "end": 5860, + "end": 5859, "subtype_start": 5502, - "subtype_end": 5748, + "subtype_end": 5747, "orientation": "forward", "distance": 0.5374618963580942, "protein": "MQSLEILAIVALVVAFIIAIVVWSIVLIEYRKIRRQKRIDRILDRIRERAEDSGNESEGDQEELAALVEMGNHAHLGMGHHAPWDVNDL", @@ -1963,9 +1963,9 @@ { "name": "env", "start": 5753, - "end": 8315, + "end": 8314, "subtype_start": 5665, - "subtype_end": 8212, + "subtype_end": 8211, "orientation": "forward", "distance": 0.5078662118966413, "protein": "MRVKGTKKNWQPSWRWGTMLIWGWATMLLGMSMTCNAEDSWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVELNVTENFNAWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTELKNSTGEMKNCSFNATTAIRDKVQKQYALFYRLDVVQIKDDNTSYNTRYRLINCNSSTITQACPKVSFEPIPIHYCAPAGFAILKCKDKNFNGTGLCENVSTVQCTHGIRPVVSTQLLLNGSLAEGDVVIRSKNFSNSAQTIIVQLNETVEINCTRPNNNTRKSIHIGPGRAFYATGDIIGDIRQAHCNISRAKWNETLKKIADKLREQFKRETIVFNQSSGGDPEIVMHSFNCRGEFFYCNTTQLFNSTWNSTTGVNGTGANNTEVNIITLPCKIKQIVNMWQEVGKAMYAPPISGQISCSSNITGLLLLRDGGNSNDTDNTTEIFRPGGGDMRDNWRSELYKYKVVQIEPLGVAPTKARRRVVQREKRAVGIGALFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTNVPWNSSWSNKNLSYIWNNMTWMQWEKEIDNYTEEIYNLIEQSQNQQEKNEQELLELDKWASLWTWFDITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTLLPAARGPDRPEGIGEEGGERDRDRSSHLAHGFLTIIWVDLRSLFLFSYHHLRDLLLIVARGVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRFIEVLQRIFRAIIHIPTRIRQGLERALL", @@ -1975,9 +1975,9 @@ { "name": "tat_exon2", "start": 7896, - "end": 8004, + "end": 8003, "subtype_start": 7793, - "subtype_end": 7901, + "subtype_end": 7900, "orientation": "forward", "distance": 0.5826923076923078, "protein": "RPSSQPRGDPTGPKESEKKVERETETDPVT", @@ -1987,9 +1987,9 @@ { "name": "rev_exon2", "start": 7897, - "end": 8173, + "end": 8172, "subtype_start": 7794, - "subtype_end": 8070, + "subtype_end": 8069, "orientation": "forward", "distance": 0.45968205324650446, "protein": "DPPPSREGTRQARRNRRRRWRERQRQIQSLSAWILNNYLGRPAEPVPLQLPPLERLTLDCSEGSGTSGTQGVGSPQVLVESPAVLEPGTKE", @@ -1999,9 +1999,9 @@ { "name": "nef", "start": 8316, - "end": 8940, + "end": 8939, "subtype_start": 8213, - "subtype_end": 8834, + "subtype_end": 8833, "orientation": "forward", "distance": 0.5254870367657829, "protein": "MGGIFSKRNGGGWPAIRERMRRAQPAADGVGAASRDLERHGALTSNNTPANNADCAWLEAQEEGEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIYSQQRQDILDLWVYNTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPMEPEDVEKATEGEDNILLHPVNQHGMDDSEREVLVWKFDSRLAFRHVAREIHPEYYKNC", @@ -2013,9 +2013,9 @@ { "name": "gag", "start": 532, - "end": 2047, + "end": 2046, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.27270615563298484, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNTIAVLYCVHQRIDVKDTKEALNKIEEEQNKSKKKAQQAAADTGNSSQSSQVSQNYPIVQNHQGQMVYQALSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIIMGLNKIVRMYSPISILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQATGGATNIMMQKGNFRNQGKPIKCFNCGKEGHLARNCRAPRKKGCWKCGKEGHQMKDCSERQANFLGKIWPSHKGRPGNFLQNRPEPTAPPEESFRFGEETTAPPQKQEPTDKELYPFSSLKSLFGNDPSSQ", @@ -2025,9 +2025,9 @@ { "name": "pol", "start": 1839, - "end": 4851, + "end": 4850, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.21944123990570308, "protein": "FFRENLAFPQGKAREFPPEQTRANSPTRRELQVWGRDNSSPSEAGADRQGTVSLLFPQITLWQRPLVTVKIGGQLKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTKIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDESFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIEQHRAKVENLREHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVITLTEEAELELAENREILKEPVHGVYYDPSKDLVAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIATESIVVWGKIPKFRLPIQKETWETWWMEYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVIPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQEDHEKYHSNWKAMASDFNIPPVVAKEIIASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGEYCAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -2037,9 +2037,9 @@ { "name": "vif", "start": 4795, - "end": 5374, + "end": 5373, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWVYRHHYESTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYNTQVDPGLADQLIHMYYFDCFSESAIRQAILGHRVSPSCEYQAGHNKVGSLQYLALAVLVAPKKIKPPLPSVARLTEDRWNKPRKIKGHRESHTMNGH", @@ -2049,9 +2049,9 @@ { "name": "vpr", "start": 5313, - "end": 5598, + "end": 5597, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.39401343921808174, "protein": "MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPREWLHSLGQHIYETYGDTWAGVGAIIRILQQLLFIHFRIGCHHSRIGILRRTRNGARRS", @@ -2061,9 +2061,9 @@ { "name": "tat_exon1", "start": 5578, - "end": 5797, + "end": 5796, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.5138258357408172, "protein": "MEPVDPRLEPWKHPGSQPRTPCNNCYCKKCCFHCQVCFTKKGLGISYGRKKRRQRRGPPRDSQIHQVPLPKQ", @@ -2073,9 +2073,9 @@ { "name": "rev_exon1", "start": 5717, - "end": 5798, + "end": 5797, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.5940834141610087, "protein": "MAGRSGDRDEDLLETVRFIKFLYQNSK", @@ -2085,9 +2085,9 @@ { "name": "vpu", "start": 5809, - "end": 6055, + "end": 6054, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5727186311787074, "protein": "MQPLEISAIVALVVVAIIAIVVWTIVLLEYRKILRQKKIDRLINRISERAEDSGNESDGDQEELSALMEMGRLAPWNVDDL", @@ -2097,9 +2097,9 @@ { "name": "env", "start": 5972, - "end": 8549, + "end": 8548, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5021538905210794, "protein": "MRVTGIKKNCQLLWRWGALLLGMLMICSATNMWVTVYYGVPVWKDATTTLFCASDAKAYDTEIHNVWATHACVPTDPDPQEVVLENVTENYNMGKNNMVEQMHEDIISLWDQSLKPCVLLTPFCVTLNCTDANITSTNNSRDKKEGESTLEETKGEIKNCSFNMTSSMSDKSQKQRALFYKLDVVQIDETNNNSYRLISCNTSVVTQACPKVSFDPIPIHYCAPAGFAILKCNNKKFNGTGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSENFTNNAKTIIVQLKTPVQINCTRPNNNTRKRISMGPGRVIYATGQIIGDIRKAHCNISRAEWNTTLKQIVTQLRKQWNRTIIFNSSSGGDPEIVMHSFNCRGEFFYCNTTKLFNSTWPRNSTWNNTEGSNDTEIITLPCRIKQIVNRWQEVGKAMYAPPIQGQISCSSNITGLLLVRDGGINTSESNETFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGMLGAMFLGLLGAAGSTMGAASVTLTVQTRLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARLLAVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNRSYEDIWNNMTWMEWEKEIDNYTGLIYTLIEKSQNQQEINEQELLSLDKWASLWNWFNITNWLWYIKIFIMIVGGLIGLRIVFAVLSIVNRVRQGYSPLSLQTPRPAPRGPDRPEEIEEGGGERDRDRSVRLVTGFFALFWDDLRSLCLFSYHHLRDLILIVVRVVEILGRRGWEALKYWWNLLQYWSQEIKNSAISLLNATAIAVAEGTDRIIGVVQRTWRAFIHIPRRIRQGFERALL", @@ -2109,9 +2109,9 @@ { "name": "tat_exon2", "start": 8130, - "end": 8226, + "end": 8225, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.6074396517609815, "protein": "RPPAQPQGDPTGPKKSKKEVEKETETDQCD", @@ -2121,9 +2121,9 @@ { "name": "rev_exon2", "start": 8131, - "end": 8407, + "end": 8406, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.47688921496698455, "protein": "DPPPSPKGTRQARRNRRRRWRKRQRQISAISDWILRTFLGRSTKPVPLQLPPLERLNLDCSEGCGNSGTQGVGSPQILVESPAVLESGNKE", @@ -2133,9 +2133,9 @@ { "name": "nef", "start": 8550, - "end": 8985, + "end": 8984, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.6017710152157637, "protein": "MGGKWSKKSGGGWPAVREKMKRTEPAAEGVGAASRDLDKYGAITSSNTAQTNPDCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDMSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGGCFK", @@ -2147,9 +2147,9 @@ { "name": "gag", "start": 120, - "end": 2022, + "end": 2021, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.7511039743075072, "protein": "MTKTLLVQNANPDCKTILKALGPAATLEEMMTACQKVRRPGHKAKVLAEAMSQATGAANIMMQRGNFKNQRKPVKCFNCGKEKHIAKNCKAPKKKGC", @@ -2159,9 +2159,9 @@ { "name": "pol", "start": 1787, - "end": 4826, + "end": 4825, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.7637180771917039, "protein": "ASQIYAKIKVKQLCKLLKRTKALTEVVPLTEEAELELAENRKILKDPVHRAYYDPAKDLIAELQKQREGQWTYQIYQKPFKNLKTEKYARTKGAHTNDVKQLTEAVQKISTESIVI", @@ -2171,9 +2171,9 @@ { "name": "vif", "start": 4425, - "end": 5349, + "end": 5348, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7566838361540349, "protein": "MIVWQVDRMKIRTWKSLVKYHMYISKKAKK", @@ -2183,9 +2183,9 @@ { "name": "vpr", "start": 5033, - "end": 5579, + "end": 5578, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.7334692430420138, "protein": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS", @@ -2195,21 +2195,21 @@ { "name": "tat_exon1", "start": 5486, - "end": 5780, + "end": 5776, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.7619181418001311, "protein": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS", - "aminoacids": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS*TRALEASRKSA*DSLYQLLL*KVLLSLPSVFYTKSLRHLLWQEEAETETKISSRQSDSSSSSTKAVN", - "nucleotides": "ATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACTAGAGCCCTAGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAAT" + "aminoacids": "MLFIHFRIKCHHSRIGIVLQRRARNRASRS*TRALEASRKSA*DSLYQLLL*KVLLSLPSVFYTKSLRHLLWQEEAETETKISSRQSDSSSSSTKAV", + "nucleotides": "ATGCTGTTTATTCATTTCAGAATTAAGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATAGAGCCAGTAGATCATAGACTAGAGCCCTAGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTA" }, { "name": "rev_exon1", "start": 5698, - "end": 5779, + "end": 5778, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.524971623155505, "protein": "MAGRSGDRDEDLLKTVRLIKFLYQSSK", @@ -2219,9 +2219,9 @@ { "name": "vpu", "start": 5790, - "end": 6039, + "end": 6038, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7407973896196594, "protein": "MQPLKILAIVALVVAAIIAIVV", @@ -2231,9 +2231,9 @@ { "name": "env", "start": 5953, - "end": 8521, + "end": 8520, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.7529994904340572, "protein": "MTNCSFNITTEIRDKVRKEYALFYKLDVMPIDKDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPASFAILKCKDEMFNRTRPCKNVSTVQCTHRIRPVVSTQLLLNSSLAEKKIVLRSENFTDNTKNIIVQLNRSIVINCTRPNNNTRKSISVAKRAIYATRQIIEDIRQAHCNISETD", @@ -2243,9 +2243,9 @@ { "name": "nef", "start": 7916, - "end": 9176, + "end": 9175, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.7587548638132295, "protein": "MSLHRMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC", @@ -2255,9 +2255,9 @@ { "name": "tat_exon2", "start": 8102, - "end": 8198, + "end": 8197, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.7134052388289676, "protein": "RPSSQPQEDQTGPKE", @@ -2267,9 +2267,9 @@ { "name": "rev_exon2", "start": 8103, - "end": 8379, + "end": 8378, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.6888374145157732, "protein": "ILTTHLRRPAKPVPFQLPPLKRLTLDCAEDCANSRTQEVRDPQVLVESPAVLNSGTKE", @@ -2281,9 +2281,9 @@ { "name": "gag", "start": 302, - "end": 1715, + "end": 1714, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.7484174646972894, "protein": "MTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVRGPGHKARVLAEAMSQVTKSASIIVQGGNFKNQRKNVKCFNCGKERHTAKNCRAPKKKGC", @@ -2293,9 +2293,9 @@ { "name": "pol", "start": 1613, - "end": 4625, + "end": 4624, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.7535201229073285, "protein": "AEIKQEFSIPYNPQSQRVVKSMNNKLKKIIGQVKDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED", @@ -2305,9 +2305,9 @@ { "name": "vif", "start": 4289, - "end": 4988, + "end": 4987, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7624714704923379, "protein": "MAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFQVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYRKQMAGDDCVASRQDED", @@ -2317,9 +2317,9 @@ { "name": "vpr", "start": 5087, - "end": 5378, + "end": 5377, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.6737199868435482, "protein": "MEQVPEDQRPQKEPYNKWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDT", @@ -2329,21 +2329,21 @@ { "name": "tat_exon1", "start": 5235, - "end": 5577, + "end": 5573, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.6325105553751218, "protein": "MTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ", - "aminoacids": "MEILRQR*KP**EPCNNCCSFISELGVNIAG*ELFDRGEQEIEPVDPSLEP*KHPGSQPMTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ*", - "nucleotides": "ATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGCTTAGAGCCCTAGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAACAAAAAGCTTAGGCATCTCCTATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA" + "aminoacids": "MEILRQR*KP**EPCNNCCSFISELGVNIAG*ELFDRGEQEIEPVDPSLEP*KHPGSQPMTACNNCYCKRCCFHCQVCFTTKSLGISYGRKKQRQRRRASHSSQNHQAALPEQ", + "nucleotides": "ATGGAGATACTTAGGCAGAGGTAGAAGCCATAATAAGAACCCTGCAACAACTGTTGTTCATTCATTTCAGAATTAGGTGTCAACATAGCAGGATAGGAATTATTCGACAGAGGAGAGCAAGAAATAGAGCCAGTAGATCCTAGCTTAGAGCCCTAGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACAACAAAAAGCTTAGGCATCTCCTATGGCAGGAAGAAGCAGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAG" }, { "name": "rev_exon1", "start": 5497, - "end": 5578, + "end": 5577, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.564475664826894, "protein": "MAGRSRDSDEELLTAVRIIKRLYQSSK", @@ -2353,9 +2353,9 @@ { "name": "vpu", "start": 5589, - "end": 5835, + "end": 5834, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.6256860592755216, "protein": "MHALEIAAIAGLVVAAIIAIVVWSIVLIEYKKILRQRKIDRLINRIRERAEDSGNESDEDQEELSALVEMRHLVP", @@ -2365,9 +2365,9 @@ { "name": "env", "start": 5752, - "end": 8353, + "end": 8352, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.7518870380010406, "protein": "MKEKGEIKNCSFNVTTGIRDKVTKEHALFYKLNVVPIDEDSKNTTGKYKMINCNTSVITQACPKVSFKPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEKIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYRTDIIRDIRQAHYNISKKD", @@ -2377,9 +2377,9 @@ { "name": "nef", "start": 7748, - "end": 8996, + "end": 8995, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.7328145265888457, "protein": "MTYKRALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFR", @@ -2389,9 +2389,9 @@ { "name": "tat_exon2", "start": 7934, - "end": 8027, + "end": 8026, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.5633802816901408, "protein": "RPSSQPREDPTGPKEQKKEVERKTEAHPRD", @@ -2401,9 +2401,9 @@ { "name": "rev_exon2", "start": 7935, - "end": 8211, + "end": 8210, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.6781884553958476, "protein": "ILSTHLGRPAEPVPLQLPPLERLTLNCGENCRTSRTQKVRSTEVLVESPAVLESGNKE", @@ -2415,9 +2415,9 @@ { "name": "gag", "start": 292, - "end": 1795, + "end": 1794, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.25442849599155104, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKRYKLKHIVWASRELERFAVNPGLLETTEGCKQILEQLQPSLPTGSEELRSLFNTVATLYCVHKRIEVQDTKEALEKIEEEQNKSKKKAQQAVADTGSTSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPVAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKVLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSSKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ", @@ -2427,9 +2427,9 @@ { "name": "pol", "start": 1587, - "end": 4599, + "end": 4598, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.17509882471546434, "protein": "FFREDLAFLQGKARELSSEQTRANSPTRGELQVWGGDSNSSSEAGAGGQGSVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVQLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSIPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMIKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPDKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLKGAKALTEVIQLTEEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARTRGTHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTSRGRQKVVSLTDTTNQKTELQAICLALQDSGLEVNIVTDSQYALGIIQAQPDRSESEIVNQIIEQLIKKERVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHNNWRAMASDFNLPPVVAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKAIHTDNGTNFTSATVKAACWWAGIKQECGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -2439,9 +2439,9 @@ { "name": "vif", "start": 4543, - "end": 5122, + "end": 5121, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.34158090650317496, "protein": "MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTYWGLHTGERDWHLGQGVSIECRERKYSTQVTPDLADQLIHLYYFDCFAESAIREAILGHRVSPRCEYQAGHNKVGSLQYLALTALVTPKKTKPPLPSVTKLTEDRWNKPQKTKGHRGSQTMNGH", @@ -2451,9 +2451,9 @@ { "name": "vpr", "start": 5061, - "end": 5352, + "end": 5351, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.2608047690014903, "protein": "MEQAPEDQGPQREPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS", @@ -2463,9 +2463,9 @@ { "name": "tat_exon1", "start": 5332, - "end": 5551, + "end": 5550, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.37688442211055273, "protein": "MEPVDPRLEPWKHPGSQPKTPCTKCYCKKCCFHCQVCFITKGLGISYGRKKRRQRRRPPQDSQTHQVPLPKQ", @@ -2475,9 +2475,9 @@ { "name": "rev_exon1", "start": 5471, - "end": 5552, + "end": 5551, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEDLLKTVRLIKYLYQSSE", @@ -2487,9 +2487,9 @@ { "name": "vpu", "start": 5563, - "end": 5809, + "end": 5808, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5560235888795282, "protein": "MQSLYILTIVALVVAAILAIVVWAIVLIEYKKILKQRRIDRLIDRIIDRAEDSGNESEGDQEELSALVEMGHHAPWNVDDL", @@ -2499,9 +2499,9 @@ { "name": "env", "start": 5726, - "end": 8288, + "end": 8287, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5276672448389619, "protein": "MRVKEIKRSYQHLWRWGIMLLGMLMIYSTADQWWVTVYYGVPVWREANTTLFCASDAKAYSTEAHNVWATHACVPTDPNPQEIVIGNVTEDFNMWKNNMVDQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDIRNSTVTSNTTTWGEMTNCTFNITTSIKDKMKKEAALFYKIDLVEIDEEKNNSSTRYRLINCNTSAITQACPKVSFEPIPIHFCAPAGFAILKCNNKKFSGKGPCTNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIQIFCIRPNNNTRKSINIGPGRAFYTTGDIIGDIRQAHCNISGNWNNTLKQIATQLGKQLNQTQQIIFNSSAGGDPEIVTHSFNCGGEFFYCNSSSLFNSTWTKNGTGSWQSNDTQNGNITLQCRIKQIINLWQGVGKAMYAPPISGQINCTSNITGLVLTRDGGKVINETETFRPGGGNMKDNWRSELYKYKVVRIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASIALTEQARRVLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGLWGCSGKLICTTTVPWNRSWGGHNKNLDDIWGNMTWMEWEKEIDNYTSLIYTLITESHSQQEKNEQELLALDKWASLWNWFDISQWLWYIKIFIMIVGGLVGLRIVFAVLSIVNKVRQGYSPLSFQTLLPAPRGADRPEGIEEGGGERDKGRSGRLVNGFLALIWDDLRSLCLFSYHRLSDLLLIVIRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNTTAIVVAEGTDRIIEILQRIGRAFLHIPRRIRQGLERALL", @@ -2511,9 +2511,9 @@ { "name": "tat_exon2", "start": 7869, - "end": 7965, + "end": 7964, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.6995153473344102, "protein": "RPSSQLRGEPTGPKE", @@ -2523,9 +2523,9 @@ { "name": "rev_exon2", "start": 7870, - "end": 8146, + "end": 8145, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.32366339007432277, "protein": "DPPPSSEGSRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDCDQDCGTSGTQGVGSPQILVESPAVLESGTKE", @@ -2535,9 +2535,9 @@ { "name": "nef", "start": 8289, - "end": 8940, + "end": 8939, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4631394979345408, "protein": "MGGKWSKSSRVGWNAVRERMRRAQPTADRERAEPAADGVGAASRDLEKYGALTSRNTAATNADCAWLEAQEEEDEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHGMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC", @@ -2549,9 +2549,9 @@ { "name": "gag", "start": 521, - "end": 2021, + "end": 2020, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -2561,9 +2561,9 @@ { "name": "pol", "start": 1813, - "end": 4825, + "end": 4824, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -2573,9 +2573,9 @@ { "name": "vif", "start": 4769, - "end": 5348, + "end": 5347, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -2585,9 +2585,9 @@ { "name": "vpr", "start": 5287, - "end": 5578, + "end": 5577, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -2597,9 +2597,9 @@ { "name": "tat_exon1", "start": 5558, - "end": 5777, + "end": 5776, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -2609,21 +2609,21 @@ { "name": "rev_exon1", "start": 5697, - "end": 5778, + "end": 5774, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 5789, - "end": 6035, + "end": 6034, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -2633,9 +2633,9 @@ { "name": "env", "start": 5952, - "end": 8493, + "end": 8492, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -2645,9 +2645,9 @@ { "name": "tat_exon2", "start": 8074, - "end": 8170, + "end": 8169, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -2657,9 +2657,9 @@ { "name": "rev_exon2", "start": 8075, - "end": 8351, + "end": 8350, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -2669,9 +2669,9 @@ { "name": "nef", "start": 8494, - "end": 9109, + "end": 9108, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -2683,9 +2683,9 @@ { "name": "gag", "start": 62, - "end": 1601, + "end": 1600, "subtype_start": 140, - "subtype_end": 1643, + "subtype_end": 1642, "orientation": "forward", "distance": 0.7362754920106639, "protein": "MSQVNSTTVMMQKGNFRNQKKTVKCFNCGKIGHIAKNCRAPRRKGCWKCGQEGHQMKDCSERQANFLGKLWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETATPPQKQEPIDRELYSLASLKSLFGNDPSSQ", @@ -2695,9 +2695,9 @@ { "name": "pol", "start": 1393, - "end": 4405, + "end": 4404, "subtype_start": 1435, - "subtype_end": 4447, + "subtype_end": 4446, "orientation": "forward", "distance": 0.2475474244944199, "protein": "FFRETLAFPQGEAREFPSEQTRANSPTRGELQVWGRDSNSPSEAGADRQGTIFLSFPQITLWQRPLVSIKVGGQLKEALLDTGADDTVLEEMCLPGKWKPKMIGGIGGFIKVRQYDQIPIEIYGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVRLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSVNNETPGIRYQYNVLPQGWKGSPAIFQASMTKILEPFRKQNPDMVIYQYMDDLYIGSDLELGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPITLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKSLTEVVPLTREAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARIKGTHTNDVKQLTQAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKDPIVGAETFYVDGAANRDTKLGKAGYVTDRGRQKIVPLTDTTNQKTELQAIYLALQDSGSEVNIVSDSQYAIGILQAQPDKSESELVNQIIEQLIKKEKVYLTWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVNTIHTDNGSNFTSTAVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGRYSAGERIVDMIASDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSEIKVVPRRKAKIIRDYGKQMAGDDCVAGRQDED", @@ -2707,9 +2707,9 @@ { "name": "vif", "start": 4349, - "end": 4928, + "end": 4927, "subtype_start": 4391, - "subtype_end": 4970, + "subtype_end": 4969, "orientation": "forward", "distance": 0.4686663095875737, "protein": "MENRWQVMIVWQVDRMRINAWKSLVKHHMHVSRKVERWVYKHHYESTNPRISSEVHIPLGDARLKITTYWGLHTGERDWHLGQGVSIEWRKKSYNTQVDPEVADQLIHLYYFDCFSESAIRKAIVGHRVSPSCEYQAGHNKVGSLQYLALAALVKSKKTKPPLPSVTKLTEDRWNKPQRTKGRRGNHIMNGH", @@ -2719,9 +2719,9 @@ { "name": "vpr", "start": 4867, - "end": 5158, + "end": 5157, "subtype_start": 4909, - "subtype_end": 5200, + "subtype_end": 5199, "orientation": "forward", "distance": 0.4534005037783373, "protein": "MEQAPEDQGPQREPYNEWALELLEELKREAVRHFPRIWLQSLGQYVYETYGDTWTGVEAIIRILQQMLFIHFRIGCQHSRIGIIRRGRTRNGASRP", @@ -2731,9 +2731,9 @@ { "name": "tat_exon1", "start": 5138, - "end": 5357, + "end": 5356, "subtype_start": 5180, - "subtype_end": 5399, + "subtype_end": 5398, "orientation": "forward", "distance": 0.48719691819623834, "protein": "MEPVDPSLAPWKHPGSQPKTACTNCYCKKCCLHCQVCFTKKGLGISYGRKKRRQRRRPPQSSKAHQNPLPKQ", @@ -2743,21 +2743,21 @@ { "name": "rev_exon1", "start": 5277, - "end": 5358, + "end": 5354, "subtype_start": 5319, - "subtype_end": 5397, + "subtype_end": 5396, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEDLLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEDLLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAGCAGTAAGGCTCATCAAAATCCTCTACCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEDLLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEDLLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAAGCAGTAAGGCTCATCAAAATCCTCTACCAAAGCAGT" }, { "name": "vpu", "start": 5369, - "end": 5615, + "end": 5614, "subtype_start": 5411, - "subtype_end": 5657, + "subtype_end": 5656, "orientation": "forward", "distance": 0.46373488953730724, "protein": "MQSLQIGAIVALVVGTIIAIVVWSIVLIEYRKILRQKKIDRIIDRIVERAEDSGNESEGDQEELSALVERGHDAPWNVNDL", @@ -2767,9 +2767,9 @@ { "name": "env", "start": 5532, - "end": 8073, + "end": 8072, "subtype_start": 5574, - "subtype_end": 8124, + "subtype_end": 8123, "orientation": "forward", "distance": 0.47450452559300893, "protein": "MRVKETRKSYQHWWKGGMMLLGMLMICSAATNLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVLLGNVTEDFNAWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILHCTDVNNTRNGMTGELKNCSFNITTKITNKVQKEYALFYKLDVVPINNKDNDTSFNNNSYRLISCNTSVITQACPKVSFEPIPIHYCTPAGYAILRCNNETFSGKGPCTNVSSIQCTHGIRPVVSTQLLLNGSLAKQEVVIRSQNFSDNVKTIIVQLKTPVKINCTRPNNNTRKSIHAGPGKVIYATGEIIGDIRQAHCNISAAEWNDTLGQIVTKLQEQFGNKTIVFNQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWNNNGTNTWNSTGNITLPCKIRQIVNMWQKVGKAMYAPPIRGQIKCSSNITGLLLTRDGGNESESETFRPGGGDMRDNWRSELYKYKVVRIEPLGLAPTKAKRRVVQREKRAIGTLGAVFLGFLGTAGSTMGAASMTLTVQARQLLSGIVQQQNNLLKAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNASWSNKSLNEIWDNMTWMEWEKEISNYTQLIYTLIEESQSQQEKNEQELLALDKWDSLWSWFSITKWLWYIKIFIMIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEDGGERDRDRSTRLVTGFLPLFWDDLRSLCLFSYHRLRDLLLIAARIVELLGHRGWEILKHWWSLLQYWSQELKKSAVSLLNATAIAVAEGTDRIIEVVQRACRAILHIPVRLRQGLERALL", @@ -2779,9 +2779,9 @@ { "name": "tat_exon2", "start": 7654, - "end": 7750, + "end": 7749, "subtype_start": 7705, - "subtype_end": 7798, + "subtype_end": 7797, "orientation": "forward", "distance": 0.4464285714285715, "protein": "RPASQPRGDPTGPKESKKTVERETETDPHA", @@ -2791,9 +2791,9 @@ { "name": "rev_exon2", "start": 7655, - "end": 7940, + "end": 7939, "subtype_start": 7706, - "subtype_end": 7982, + "subtype_end": 7981, "orientation": "forward", "distance": 0.46126825660935467, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIHTLSNRILTTFLGRPEEPVPLQLPPLERLTLDCSEDCGTSGTQGVGNPQTLVESPTILESGTKKKCC", @@ -2803,9 +2803,9 @@ { "name": "nef", "start": 8074, - "end": 8695, + "end": 8694, "subtype_start": 8125, - "subtype_end": 8752, + "subtype_end": 8751, "orientation": "forward", "distance": 0.437094682230869, "protein": "MGGKWSKSSVVGWPAVRERIRRAGPAAEGVGAVSRDLDKHGAITSNNTPATNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGMIYSQQRQDILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPLETEQVEAATGGENNCLLHPLNQHGMDDPEREVLMWKFDSSLAFHHRAKELHPEYYKDC", @@ -2817,9 +2817,9 @@ { "name": "gag", "start": 683, - "end": 2183, + "end": 2182, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -2829,9 +2829,9 @@ { "name": "pol", "start": 1975, - "end": 4987, + "end": 4986, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -2841,9 +2841,9 @@ { "name": "vif", "start": 4931, - "end": 5510, + "end": 5509, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -2853,9 +2853,9 @@ { "name": "vpr", "start": 5449, - "end": 5740, + "end": 5739, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -2865,9 +2865,9 @@ { "name": "tat_exon1", "start": 5720, - "end": 5939, + "end": 5938, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -2877,21 +2877,21 @@ { "name": "rev_exon1", "start": 5859, - "end": 5940, + "end": 5936, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 5951, - "end": 6197, + "end": 6196, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -2901,9 +2901,9 @@ { "name": "env", "start": 6114, - "end": 8655, + "end": 8654, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -2913,9 +2913,9 @@ { "name": "tat_exon2", "start": 8236, - "end": 8332, + "end": 8331, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -2925,9 +2925,9 @@ { "name": "rev_exon2", "start": 8237, - "end": 8513, + "end": 8512, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -2937,9 +2937,9 @@ { "name": "nef", "start": 8656, - "end": 9271, + "end": 9270, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -2951,9 +2951,9 @@ { "name": "gag", "start": 210, - "end": 1719, + "end": 1718, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.27936962750716343, "protein": "MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPSLQTGSEELRSLYNTVAVLYCVHQRINVKDTKEALDTIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPISPSTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINDEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHTPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSASIMAQGGNFRNQKRNVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDKELYPLASLRSLFGNDP", @@ -2963,9 +2963,9 @@ { "name": "pol", "start": 1511, - "end": 4523, + "end": 4522, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.26443159013103534, "protein": "FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGQGTVSFSFPQITLWQRPIISIRIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQVPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEDKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKRKKSVTVLDVGDAYFSVPLDQDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSNGIRKILFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED", @@ -2975,9 +2975,9 @@ { "name": "vif", "start": 4467, - "end": 5046, + "end": 5045, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3903081914030819, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPSLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH", @@ -2987,9 +2987,9 @@ { "name": "env", "start": 4985, - "end": 8207, + "end": 8206, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.6657028690558922, "protein": "MHSFNCGGEFFYCNTTQLFNSTWNGTDNWNGTESNNTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAVGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWRQWEKEIDNYTDTIYNLIELSQNQQEQNEQDLLALDKWASLWSWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL", @@ -2999,9 +2999,9 @@ { "name": "vpr", "start": 4985, - "end": 5276, + "end": 5275, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3120665742024965, "protein": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", @@ -3011,21 +3011,21 @@ { "name": "tat_exon1", "start": 5256, - "end": 5475, + "end": 5471, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.4691531785127845, "protein": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", - "aminoacids": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAA" + "aminoacids": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTTKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGCTTAGAGCCCTGGAAACATCCAGGAAGTCAACCTATGACTGCTTGTAACAATTGCTATTGTAAACGGTGTTGCTTTCATTGCCAAGTTTGCTTCACCACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAG" }, { "name": "rev_exon1", "start": 5395, - "end": 5476, + "end": 5475, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.5290287574606619, "protein": "MAGRSGDSDEELLTAVRIIKRLYQSSK", @@ -3035,9 +3035,9 @@ { "name": "vpu", "start": 5487, - "end": 5733, + "end": 5732, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5568484042553192, "protein": "MHALKIAAIVGLVVATIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM", @@ -3047,9 +3047,9 @@ { "name": "tat_exon2", "start": 7788, - "end": 7881, + "end": 7880, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD", @@ -3059,9 +3059,9 @@ { "name": "rev_exon2", "start": 7789, - "end": 8065, + "end": 8064, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE", @@ -3071,9 +3071,9 @@ { "name": "nef", "start": 8208, - "end": 8850, + "end": 8849, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5432971135257649, "protein": "MGNKLSRGLRAGWPAIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTFKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHMARELHPEYFKDC", @@ -3085,9 +3085,9 @@ { "name": "gag", "start": 739, - "end": 2239, + "end": 2238, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -3097,9 +3097,9 @@ { "name": "pol", "start": 2031, - "end": 5043, + "end": 5042, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -3109,9 +3109,9 @@ { "name": "vif", "start": 4987, - "end": 5566, + "end": 5565, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -3121,9 +3121,9 @@ { "name": "vpr", "start": 5505, - "end": 5796, + "end": 5795, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -3133,9 +3133,9 @@ { "name": "tat_exon1", "start": 5776, - "end": 5995, + "end": 5994, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3145,9 +3145,9 @@ { "name": "rev_exon1", "start": 5915, - "end": 5996, + "end": 5995, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -3157,9 +3157,9 @@ { "name": "vpu", "start": 6007, - "end": 6253, + "end": 6252, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -3169,9 +3169,9 @@ { "name": "env", "start": 6170, - "end": 8711, + "end": 8710, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4583799776107468, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -3181,9 +3181,9 @@ { "name": "tat_exon2", "start": 8292, - "end": 8388, + "end": 8387, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3193,9 +3193,9 @@ { "name": "rev_exon2", "start": 8293, - "end": 8569, + "end": 8568, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -3205,9 +3205,9 @@ { "name": "nef", "start": 8712, - "end": 9327, + "end": 9326, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -3219,9 +3219,9 @@ { "name": "gag", "start": 221, - "end": 1730, + "end": 1729, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.2880084183556756, "protein": "MGARASVLSGGELDRWEKIYLRPGGKKKYRLKHIVWASRELERFAVNPGLLESSEGCRQILGQLQPALQTGSEELRSLYNTVAVLYCVHPRINVKDTKEALDKIEEEQNKSKKKAQQAAADTGNSSNSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINAEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNFRNQRRNVKCFNCGKEGHTAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEEATAPPQKQETKDQELYPLASLRSLFGNDP", @@ -3231,9 +3231,9 @@ { "name": "pol", "start": 1522, - "end": 4534, + "end": 4533, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.25117173416656646, "protein": "FFREDLAFPQGKAREFSPEQTRANSPASRELQVWGRGNSSPSEAGDEGPGTVSFSFPQITLWQRPIISIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALIEICAEMEKEGKITKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNEAPGVRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKENPDIVIYQYMDDLYVGSDLEIEQHRTKIEELRQHLLGWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIQLPDKDSWTINDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGAYYDPSKDLIAEVQKQGGDQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKIALEAIVIWGKTPKFKLPIQKETWEMWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVVSLMDTTNQRTELHAIHLALQDSGSTVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLAWVPAHKGIGGNEQVDKLVSSGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEPMHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIAAETGQETAYFILKLAGRWPVKIIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQISKIQNFRVYYRDSREPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKILRDYGKQMAGDDCVASRQDED", @@ -3243,9 +3243,9 @@ { "name": "vif", "start": 4478, - "end": 5057, + "end": 5056, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3903081914030819, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMHISKKAQRWVYRHHYESHNPKTSSEVHIPLGEARLVIKTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTALITPKRRKPPLPSVTKLTEDRWNKSQRTKGHKGSHTMNGH", @@ -3255,9 +3255,9 @@ { "name": "vpr", "start": 4996, - "end": 5287, + "end": 5286, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3351206434316354, "protein": "MEQVPEDQGPQREPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRTLQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", @@ -3267,9 +3267,9 @@ { "name": "tat_exon1", "start": 5267, - "end": 5486, + "end": 5485, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.48954161103693805, "protein": "MEPVDPSLEPWKHPGSQPMTACNNCYCKRCCFHCQVCFTRKGLGISYGRKKRRQRRRASHSSQNHQAALPEQ", @@ -3279,21 +3279,21 @@ { "name": "rev_exon1", "start": 5406, - "end": 5487, + "end": 5483, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.5290287574606619, - "protein": "MAGRSGDSDEELLTAVRIIKRLYQSSK", - "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG" + "distance": 0.4886988393402566, + "protein": "MAGRSGDSDEELLTAVRIIKRLYQSS", + "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT" }, { "name": "vpu", "start": 5498, - "end": 5744, + "end": 5743, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5568484042553192, "protein": "MHALEIAAIVGLVVAAIIAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESDGDQEELSALVEMGHLVPWDGDDM", @@ -3303,9 +3303,9 @@ { "name": "env", "start": 5661, - "end": 8262, + "end": 8261, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5052314240113498, "protein": "MKVTGTRRSYQHLWRWGILFLGMVMICSANNLWVTVYYGVPVWKEATTTLFCASDAKAYETEKHNVWATHACVPTDPSPQEVALENVTETFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDNLNLNRPNNNTCSNNTNYNITEKGEIKNCSFNVTTGIRDRVTKEHALFYKLDVVPIDEGSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPAGFAILKCKDKKFNGTGECRNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPGRAFYGTDIIGDIRQAHCNISGKDWNDTLKQIVIKLKEKFENKTIVFTQSSGGDPEIVMHSFNCGGEFFYCNTTQLFNSTWNNSTWNGTDNWNGTESNSTITLPCRIKQIINLWQEVGRAMYAPPIQGQIRCSSNITGLLLVRDGGSNNSSNDTETFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTHAKRRVVQREKRAIGLGAFFLGFLGAAGSTMGAASVTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLALERYLKDQQLLGIWGCSGKLICTTNVPWNISWSPRWNRSLDEIWTNMTWKQWEKEIDNYTDIIYNLIEQSQNQQEQNEQDLLALDKWASLWNWFDITQWLWYIKIFIMIVGGLIGLRIVFTILSIVNRVRQGYSPLSLQTLLPTQRGPDRPEGTEEGGGERDRGTSTRLVHGFLALIWDDLRSLFLFSYHRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQEIKNSAVSLLNTTAIAVAEGTDRIIEVLQRGFRAILHIPTRIRQGLERALL", @@ -3315,9 +3315,9 @@ { "name": "tat_exon2", "start": 7843, - "end": 7936, + "end": 7935, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPSSQPRGDPTGPKEQKKEVERETEAHPRD", @@ -3327,9 +3327,9 @@ { "name": "rev_exon2", "start": 7844, - "end": 8120, + "end": 8119, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPNPEGTRQARRNRRRRWRERQRHIHEISAWILSTHLGRPAEPVPLQLPPLERLTLDCGEDCGTSGTQGVGSTEVLVESPAVLESGNKE", @@ -3339,9 +3339,9 @@ { "name": "nef", "start": 8263, - "end": 8905, + "end": 8904, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5339772804571117, "protein": "MGNKLSRGLRAGWPTIRERMRRARPVREPEPAAAGVGAASRDLERHGALTSSNTAATNADVACLEAQQEEEEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPGPGVRFPLCFGWCFKLVPVDPDKVEEASVGENNCLLSPENLHGMEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC", @@ -3353,9 +3353,9 @@ { "name": "gag", "start": 527, - "end": 2297, + "end": 2296, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.706855791962175, "protein": "MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSNIIMMQRGNFRNQRKTVKCFNCGKERHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLRKIWPSSKGRPRNFLQSRPEPTAPPEESFRFREETATPPQKQEPVDKEVYPLASLKSLFGNDPSSQ", @@ -3365,9 +3365,9 @@ { "name": "pol", "start": 2089, - "end": 5101, + "end": 5100, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.7518376924488996, "protein": "AKIKQECGIPYNPQSQEVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDNRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIKDYGKQMAGDDCVASRQDED", @@ -3377,9 +3377,9 @@ { "name": "vif", "start": 5045, - "end": 5624, + "end": 5623, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7067546928117459, "protein": "MENRWQVMIVWQVDRMRISTWKSLVKHHMYISKKAQGWFYRHHYENPHPRISSEVHIPLGDARLVITTY", @@ -3389,9 +3389,9 @@ { "name": "vpr", "start": 5563, - "end": 5854, + "end": 5853, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.37688442211055273, "protein": "MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS", @@ -3401,9 +3401,9 @@ { "name": "tat_exon1", "start": 5563, - "end": 6052, + "end": 6051, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.7571801566579635, "protein": "MEQAPEDQGPQKEPNNEWTLELLEELKREAVRHFPRTWLHGLGQHIYETYEDTWTGVGALIRILQQLLFIHFRIRCQHSRIGITRQRRARNRASRS", @@ -3413,21 +3413,21 @@ { "name": "rev_exon1", "start": 5973, - "end": 6054, + "end": 6050, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEDLLKTVRLIKYLYQSSE", - "aminoacids": "MAGRSGDSDEDLLKTVRLIKYLYQSSE", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGTGAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEDLLKTVRLIKYLYQSS", + "aminoacids": "MAGRSGDSDEDLLKTVRLIKYLYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTACCTCTACCAAAGCAGT" }, { "name": "vpu", "start": 6065, - "end": 6311, + "end": 6310, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7521692502681095, "protein": "MQSLYILTIVALVVAAILAIVV", @@ -3437,9 +3437,9 @@ { "name": "env", "start": 6228, - "end": 8799, + "end": 8798, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.7471048806788873, "protein": "MTNCTFNITTSIKDKIKKEAALFYKIDLVEIDEKKNNSSTRYRLINCNTSAITQACPKVSFKPIPIHFCAPASFAILKCNNKKFSGKGPCTNVSTVQCTHRIKPVVSTQLLLNGSLAEEEVMIRSDNITDNTKNIIVQLKEAIRIFCIRPNNNTRKSINIRPGRAFYTTGDIIRDIRQAHCNISGNWSNTLKQIATQLGKQLNQTQQIIFNSSAGKDPEIVTHSFNCGKKFFYCNSSSLFNST", @@ -3449,9 +3449,9 @@ { "name": "nef", "start": 8194, - "end": 9451, + "end": 9450, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.6514772974147296, "protein": "MTYKAALDLSHFLKEKGGLEGLVYSQKRQDILDLWIYHTQGYFPDWQNYTPGPRIRYPLTFGWCFKLVPLEPDQVEEANEGENNSLLHPLSQHRMDDPEKEVLVWRFDSRLAFHHMAREKHPEFYKDC", @@ -3461,9 +3461,9 @@ { "name": "tat_exon2", "start": 8380, - "end": 8476, + "end": 8475, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.6995153473344102, "protein": "RPSSQPREEPTGPKE", @@ -3473,9 +3473,9 @@ { "name": "rev_exon2", "start": 8381, - "end": 8657, + "end": 8656, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.5716671727907683, "protein": "RERQRQIRSISERILSTYLGRSTEPMPLQLPPLERLTLDCDQDCGTSKTQEVRSPQILVESPAVLESGTKE", @@ -3487,9 +3487,9 @@ { "name": "gag", "start": 746, - "end": 2246, + "end": 2245, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -3499,9 +3499,9 @@ { "name": "pol", "start": 2038, - "end": 5050, + "end": 5049, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -3511,9 +3511,9 @@ { "name": "vif", "start": 4994, - "end": 5573, + "end": 5572, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.378905844492889, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -3523,9 +3523,9 @@ { "name": "vpr", "start": 5512, - "end": 5803, + "end": 5802, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -3535,9 +3535,9 @@ { "name": "tat_exon1", "start": 5783, - "end": 6002, + "end": 6001, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3547,21 +3547,21 @@ { "name": "rev_exon1", "start": 5922, - "end": 6003, + "end": 5999, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKILYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKILYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 6014, - "end": 6260, + "end": 6259, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -3571,9 +3571,9 @@ { "name": "env", "start": 6177, - "end": 8718, + "end": 8717, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.46021436825118545, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -3583,9 +3583,9 @@ { "name": "tat_exon2", "start": 8299, - "end": 8395, + "end": 8394, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3595,9 +3595,9 @@ { "name": "rev_exon2", "start": 8300, - "end": 8576, + "end": 8575, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -3607,9 +3607,9 @@ { "name": "nef", "start": 8719, - "end": 9334, + "end": 9333, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -3621,9 +3621,9 @@ { "name": "gag", "start": 695, - "end": 2195, + "end": 2194, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -3633,9 +3633,9 @@ { "name": "pol", "start": 1986, - "end": 5004, + "end": 5003, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.6033592883813991, "protein": "YGKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -3645,9 +3645,9 @@ { "name": "vif", "start": 4948, - "end": 5527, + "end": 5526, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.378905844492889, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -3657,9 +3657,9 @@ { "name": "vpr", "start": 5466, - "end": 5757, + "end": 5756, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -3669,9 +3669,9 @@ { "name": "tat_exon1", "start": 5737, - "end": 5956, + "end": 5955, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3681,9 +3681,9 @@ { "name": "rev_exon1", "start": 5876, - "end": 5957, + "end": 5956, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -3693,9 +3693,9 @@ { "name": "vpu", "start": 5968, - "end": 6214, + "end": 6213, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -3705,9 +3705,9 @@ { "name": "env", "start": 6131, - "end": 8672, + "end": 8671, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4585964351370794, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEVHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRDKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLDQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -3717,9 +3717,9 @@ { "name": "tat_exon2", "start": 8253, - "end": 8349, + "end": 8348, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3729,9 +3729,9 @@ { "name": "rev_exon2", "start": 8254, - "end": 8530, + "end": 8529, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -3741,9 +3741,9 @@ { "name": "nef", "start": 8673, - "end": 9288, + "end": 9287, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4690990320178705, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDNEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -3755,9 +3755,9 @@ { "name": "gag", "start": 817, - "end": 2317, + "end": 2316, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -3767,9 +3767,9 @@ { "name": "pol", "start": 2109, - "end": 5121, + "end": 5120, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -3779,9 +3779,9 @@ { "name": "vif", "start": 5065, - "end": 5644, + "end": 5643, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -3791,9 +3791,9 @@ { "name": "vpr", "start": 5583, - "end": 5874, + "end": 5873, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -3803,9 +3803,9 @@ { "name": "tat_exon1", "start": 5854, - "end": 6073, + "end": 6072, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", @@ -3815,9 +3815,9 @@ { "name": "rev_exon1", "start": 5993, - "end": 6074, + "end": 6073, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -3827,9 +3827,9 @@ { "name": "vpu", "start": 6085, - "end": 6331, + "end": 6330, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -3839,9 +3839,9 @@ { "name": "env", "start": 6248, - "end": 8789, + "end": 8788, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -3851,9 +3851,9 @@ { "name": "tat_exon2", "start": 8370, - "end": 8466, + "end": 8465, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3863,9 +3863,9 @@ { "name": "rev_exon2", "start": 8371, - "end": 8647, + "end": 8646, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -3875,9 +3875,9 @@ { "name": "nef", "start": 8790, - "end": 9405, + "end": 9404, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -3889,9 +3889,9 @@ { "name": "gag", "start": 687, - "end": 2187, + "end": 2186, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.2967573174581697, "protein": "MGARASILSGGKLDEWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -3901,9 +3901,9 @@ { "name": "pol", "start": 1979, - "end": 4991, + "end": 4990, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19298018391400085, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -3913,9 +3913,9 @@ { "name": "vif", "start": 4935, - "end": 5514, + "end": 5513, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -3925,9 +3925,9 @@ { "name": "vpr", "start": 5453, - "end": 5744, + "end": 5743, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -3937,21 +3937,21 @@ { "name": "tat_exon1", "start": 5724, - "end": 5943, + "end": 5939, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5863, - "end": 5944, + "end": 5943, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -3961,9 +3961,9 @@ { "name": "vpu", "start": 5955, - "end": 6201, + "end": 6200, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -3973,9 +3973,9 @@ { "name": "env", "start": 6118, - "end": 8659, + "end": 8658, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4620723847297967, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTSEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDKDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -3985,9 +3985,9 @@ { "name": "tat_exon2", "start": 8240, - "end": 8336, + "end": 8335, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -3997,9 +3997,9 @@ { "name": "rev_exon2", "start": 8241, - "end": 8517, + "end": 8516, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -4009,9 +4009,9 @@ { "name": "nef", "start": 8660, - "end": 9275, + "end": 9274, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -4023,9 +4023,9 @@ { "name": "gag", "start": 555, - "end": 2055, + "end": 2054, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -4035,9 +4035,9 @@ { "name": "pol", "start": 1847, - "end": 4859, + "end": 4858, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4047,9 +4047,9 @@ { "name": "vif", "start": 4803, - "end": 5382, + "end": 5381, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -4059,9 +4059,9 @@ { "name": "vpr", "start": 5321, - "end": 5612, + "end": 5611, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -4071,21 +4071,21 @@ { "name": "tat_exon1", "start": 5592, - "end": 5811, + "end": 5807, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5731, - "end": 5812, + "end": 5811, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -4095,9 +4095,9 @@ { "name": "vpu", "start": 5823, - "end": 6069, + "end": 6068, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAKDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -4107,9 +4107,9 @@ { "name": "env", "start": 5986, - "end": 8527, + "end": 8526, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4581222593756883, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVEKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -4119,9 +4119,9 @@ { "name": "tat_exon2", "start": 8108, - "end": 8204, + "end": 8203, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -4131,9 +4131,9 @@ { "name": "rev_exon2", "start": 8109, - "end": 8385, + "end": 8384, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -4143,9 +4143,9 @@ { "name": "nef", "start": 8528, - "end": 9143, + "end": 9142, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPMSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -4157,9 +4157,9 @@ { "name": "gag", "start": 246, - "end": 1782, + "end": 1781, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.35613851839948674, "protein": "MGARASVLSGGELDKWEKIRLRPGGRKRYKLKHIVWASRELERFAVNPGLLETSEGCKQIMGQLQPALQTGSEELRSLYNTVAVLYCVHQRIDVKDTKEALDKIEEEQNKSKKKTQQAAAADTGNNSQVSQNYPIVQNMQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVQAGPVAPGQIREPRGSDIAGTTSTLQEQIAWMTHNPPVPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKGWMTETLLVQNANPDCKTILKALGPGATLEEMMTACQGVGGPSHKARVLAEAMSQATGAHAIMMQRGNFKNQRKTVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESLRPTAPPVESFRFGEETAAPFQKQEPRDKEMSPLASLKSLFGNDQ", @@ -4169,9 +4169,9 @@ { "name": "pol", "start": 1544, - "end": 4586, + "end": 4585, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.24526399193257942, "protein": "FFRENLAFPQGKAGEFPSEQTRANSPTRGEPQANSPTSRELQVWGRDSSPLSEAGTERQGDVSLSFPQITLWQRPVVTIKIGGQIKEALLDTGADDTVLEEMALPGRWKPKMIGGIGGFIKVRQYDQIAIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKIKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPIFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSITVLDVGDAYFSVPLDEEFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRTKIEELRGHLLKWGFTTPDKKHQKEPPFLWMGYELHPDRWTVQPIKLPEKEIWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTEEAELELAENREILKEPVHGVYYDPTKELIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKISTESIVIWGKTPKFKLPIQKETWEIWWTDYWQATWIPEWEFVSTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYITDRGRQKVVTLNDTTNQKTELQAILLALQDSGLEANIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKIYLTWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDRAQEEHERYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQIDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGVKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQISKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4181,9 +4181,9 @@ { "name": "vif", "start": 4530, - "end": 5109, + "end": 5108, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMYVSKKTKGWFYRHHYESTHPKISSEVHIPLGDAELVVTTYWGLQPGERDWHLGQGVSIEWRKGRYRTHVDPNLADQLIHLHYFDCFSESAIRHAILGHRVSPRCEYQAGHNKVGSLQYLALAALRAPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -4193,9 +4193,9 @@ { "name": "vpr", "start": 5048, - "end": 5339, + "end": 5338, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKQEAVRHFPRPWLHSLGQYIYETYGDTWAGVEAIIRMLQQLLFIHFRIGCQHSRIGIIPQRRARNGSSRS", @@ -4205,21 +4205,21 @@ { "name": "tat_exon1", "start": 5319, - "end": 5538, + "end": 5534, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.5237430167597767, "protein": "MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ", - "aminoacids": "MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ*", - "nucleotides": "ATGGATCCAGTAGATCCTAACCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTAACAATTGCTATTGTAAAAAGTGTTGCCTTCATTGCCAAGTTTGTTTCACACGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAGTAA" + "aminoacids": "MDPVDPNLEPWKHPGSQPKTACNNCYCKKCCLHCQVCFTRKGLGISYGRKKRRRRRGSLKGRQAHQDSLSKQ", + "nucleotides": "ATGGATCCAGTAGATCCTAACCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAGACTGCTTGTAACAATTGCTATTGTAAAAAGTGTTGCCTTCATTGCCAAGTTTGTTTCACACGAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACGGAGACGAGGATCTCTTAAAGGCCGTCAGGCTCATCAAGACTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5458, - "end": 5539, + "end": 5538, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.5622384937238494, "protein": "MAGRSGDGDEDLLKAVRLIKTLYQSSK", @@ -4229,9 +4229,9 @@ { "name": "vpu", "start": 5550, - "end": 5808, + "end": 5807, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.6039004707464695, "protein": "MLSLEVIVAITALVVAGIIAIVVWTIVLIEYRKILRQRKIDKILDRIRERAEDSGNESEGDQEELSALVEMGHNAHHAPWDIND", @@ -4241,9 +4241,9 @@ { "name": "env", "start": 5716, - "end": 8257, + "end": 8256, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5196110433453024, "protein": "MRVRGIRKNCQRLWRWGTMLTMLLGILMISNATEQLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEMVLINVTENFNMWKNDMVDQMQEDIVSLWDQSLKPCVKLTPLCVTLNCTNLTIEPNNATKANISGRLEGKGEMTNCSFNVTTSLRDKRKKEYALFYKLDVVATGENNNSFRLISCNTSEITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGKCNNVSIVQCTHGIRPVVSTQLLLNGSLAEEEVVVRSANFSDNTKTIIVQLNKTVVINCTRPNNNTRRSIHIAPGRAFYATGDIIGDIRKAHCNISKEDWNTTLNQVAKKLQEQFENATIDFKPSSGGDPEIVMHSFNCGGEFFYCNTTELFSWNATTKLFTWNATNSNNGTIILPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGTNGTGNRNETFRPGGGNMKDNWRSELYKYKVVEIKPLGVAPTKAKRRVVQREKRAVTIGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNISWSNRTLNNIWDNLTWMQWDTEINNYTNKIYQLLEEAQNQQEKNEQELLELDKWANLWNWFDISNWLWYIKIFILIVGGLIGLRIVFTVLSIVNRVRQGYSPLSFQTRFPVPRGPDRPEGTEEEGGERDRDRSDRLVNGFLTLIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNVLQYWSQELKNSAVSLLNATAIVVAEGTDRIIELAQRICRAE", @@ -4253,9 +4253,9 @@ { "name": "tat_exon2", "start": 7874, - "end": 7970, + "end": 7969, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPASQSRGDPTGPKEPKKKVERETETDPTD", @@ -4265,9 +4265,9 @@ { "name": "rev_exon2", "start": 7875, - "end": 8151, + "end": 8150, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.3471418653089562, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRQISERILDTYLGRSEEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSTQILVECPAILESGTKE", @@ -4277,9 +4277,9 @@ { "name": "nef", "start": 8275, - "end": 8896, + "end": 8895, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4680383864671438, "protein": "MGGKWSKHSKSEWADVRERMAQTEAAADGVGAVSRDLERHGAITSSNTATNNAACAWLEAQEEEEVGFPVKPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRFPLCFGWCFKLVPVDPDKVEEANKGENNSLLHPMSLHGMEDTEREVLMWKFDSRLAFHHVAREKHPEYFKDC", @@ -4291,9 +4291,9 @@ { "name": "gag", "start": 2, - "end": 1697, + "end": 1696, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.7478034493979825, "protein": "MTETLLVQNANPDCKTILKALRPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTKSASIMVQGGNLKNQRKNVKCFNCGKEGHTAKNCRAPKKKGC", @@ -4303,9 +4303,9 @@ { "name": "pol", "start": 1489, - "end": 4501, + "end": 4500, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.7624366800883231, "protein": "KPKIIEGIRGFIKVRQYDQVPIKICRHKAISTVLIRPTPVNIIRRNLLTQLSCTLNFPISPIETVPVKLKPGIDSPKVKQWPLTEEKIKALIEICAEIEKERKITKIRPKNPYNTPVFAIKKKDSTK", @@ -4315,9 +4315,9 @@ { "name": "vif", "start": 4445, - "end": 5024, + "end": 5023, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7494633160752622, "protein": "MENRWQVMIVWQVDKMRIRTWNSLVKHHMHISKKAQR", @@ -4327,9 +4327,9 @@ { "name": "vpr", "start": 4963, - "end": 5254, + "end": 5253, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.4464285714285715, "protein": "MEQVPEDQRPQKEPYNEWTLELLEELKSEAVRHFPRPWLHSLGQYIYETYGDTWAEVEAIIRTLQQLLFIHFRIRCQHSRIRIIRQRRARNRASRS", @@ -4339,9 +4339,9 @@ { "name": "tat_exon1", "start": 5111, - "end": 5453, + "end": 5452, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.6409453748630458, "protein": "MTACNNCYCKRCCFHCQVCFTRKGLGISHGRKKRRQRRRASHSSQNHQAALPEQ", @@ -4351,21 +4351,21 @@ { "name": "rev_exon1", "start": 5373, - "end": 5454, + "end": 5450, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.5290287574606619, - "protein": "MAGRSGDSDEELLTAVRIIKRLYQSSK", - "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGTAAG" + "distance": 0.4886988393402566, + "protein": "MAGRSGDSDEELLTAVRIIKRLYQSS", + "aminoacids": "MAGRSGDSDEELLTAVRIIKRLYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCACAGCAGTCAGAATCATCAAGCGGCTCTACCAGAGCAGT" }, { "name": "vpu", "start": 5465, - "end": 5711, + "end": 5710, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7521692502681095, "protein": "MHALEIAAIVRLVVAAIIAIVV", @@ -4375,9 +4375,9 @@ { "name": "env", "start": 5628, - "end": 8229, + "end": 8228, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.7513561129398668, "protein": "MTEEGEIKNCSFNVTTGIRDKVTKEHALFYKLDVVPIDESSGNTTGKYRMINCNTSVITQACPKVSFEPIPIHFCAPASFAILKCKDKKFNRTGECRNVSTVQCTHRIRPVVSTQLLLNGSLAEEEIVIRSANLSNNAKTIIVQLNKSVKINCTRPNNNTRRSIHIGPRRAFYRTDIIGDIRQAHCNISRKD", @@ -4387,9 +4387,9 @@ { "name": "nef", "start": 7624, - "end": 8872, + "end": 8871, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5833488893037148, "protein": "MRQARPVRKPEPAATKVRAASRDLERHGALTSSNTAATNADVACLEAQQEEKEVGFPVRPQVPLRPMTYKGALDISHFLKEKGGLDGLIYSKRRQDILDLWLYNTQGYFPDWQNYTPRPGVRFPLCFRWCFKLVPVDPDKVEEASVGENNCLLSPENLHRIEDEHREVLQWRFDSRLAFHHVARELHPEYYKDC", @@ -4399,9 +4399,9 @@ { "name": "tat_exon2", "start": 7810, - "end": 7903, + "end": 7902, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.5303030303030303, "protein": "RPSSQPRGDPTGPKEQKKEVERKTEAHPRD", @@ -4411,9 +4411,9 @@ { "name": "rev_exon2", "start": 7811, - "end": 8087, + "end": 8086, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.6667847862036381, "protein": "ILSTHLGRPAEPVPLQLPPLERLTLDCGEDCRTSKTQKVRSTEVLVESPAVLESGNKE", @@ -4425,9 +4425,9 @@ { "name": "gag", "start": 549, - "end": 2049, + "end": 2048, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDSWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSVNVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -4437,9 +4437,9 @@ { "name": "pol", "start": 1841, - "end": 4853, + "end": 4852, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVHQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4449,9 +4449,9 @@ { "name": "vif", "start": 4797, - "end": 5376, + "end": 5375, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.378905844492889, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVNPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -4461,9 +4461,9 @@ { "name": "vpr", "start": 5315, - "end": 5606, + "end": 5605, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -4473,21 +4473,21 @@ { "name": "tat_exon1", "start": 5586, - "end": 5805, + "end": 5801, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5725, - "end": 5806, + "end": 5805, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -4497,9 +4497,9 @@ { "name": "vpu", "start": 5817, - "end": 6063, + "end": 6062, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5278361344537815, "protein": "MQPLHIAAIVGLVVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -4509,9 +4509,9 @@ { "name": "env", "start": 5980, - "end": 8521, + "end": 8520, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.46021436825118545, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTTESHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSKEGKMAEEMRNCSFNITTEIRNKMQKEYALFYKLDVVPIDDDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKSVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYGNKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSGTETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -4521,9 +4521,9 @@ { "name": "tat_exon2", "start": 8102, - "end": 8198, + "end": 8197, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -4533,9 +4533,9 @@ { "name": "rev_exon2", "start": 8103, - "end": 8379, + "end": 8378, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.40871934604904625, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVSLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -4545,9 +4545,9 @@ { "name": "nef", "start": 8522, - "end": 9137, + "end": 9136, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGVEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -4559,9 +4559,9 @@ { "name": "gag", "start": 468, - "end": 1968, + "end": 1967, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3014827756125966, "protein": "MGARASILSGGKLDAWEKIRLRPGGKKKYRLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELKSLFNAVAVLYCVHQRIQVQDTKEALEKVEEEQNKSKKKAQQVAAADTDTGNSSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWTTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYRTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVNSANVMMQRGNFRNQRKIVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETITPSQKQEPRDKELYPLSSLKSLFGSDPSSE", @@ -4571,9 +4571,9 @@ { "name": "pol", "start": 1760, - "end": 4772, + "end": 4771, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19610372855115465, "protein": "FFRENLAFPQRKARELPSEQTRANSPTRRELQVWGRDNNSLSEAGAKRQGTVSLVFPQITLWQRPLVRIKIGGQFKEALLDTGADDTVLEEMSLPGKWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLIGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKEFRKYTAFTIPSTNNETPGIRYEYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIILPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTEEAELELAENREILREPVHGVYYDPSKDLIAEVQKQGNGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWAEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDRGRQKVISLTDTTNQKTELQAIYLALQDSGSEVNIVTDSQYTLGIIQAQPDKSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSTGVRRVLFLDGIDKAQEDHEKYHSNWRAMAGDFNIPPVVAKEIVASCDKCQQKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDLQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4583,9 +4583,9 @@ { "name": "vif", "start": 4716, - "end": 5295, + "end": 5294, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.36908151428872715, "protein": "MANRWQVMIVWQVDRMRIRTWNSLVKHHMHVSKKTKGWFYRHHYESTHPRISSEVHIPLGDARLVVTTYWGLNTGEREWHLGQGVSIEWRKRKYSTQVDPNLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALKALTTPKRRKPPLPSVRKLTEDRWNEHQKTKGHRGSHTMNGH", @@ -4595,9 +4595,9 @@ { "name": "vpr", "start": 5234, - "end": 5525, + "end": 5524, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.31767642387111417, "protein": "MERAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHGLGQHIYETYGDTWTGVEAIIRTLQQLLFIHFRLGCRHSRIGIVPQRRARNGASRS", @@ -4607,21 +4607,21 @@ { "name": "tat_exon1", "start": 5505, - "end": 5724, + "end": 5720, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRAPQGSQTDQDSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5644, - "end": 5725, + "end": 5724, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELLKAVRLIKILYQSSK", @@ -4631,9 +4631,9 @@ { "name": "vpu", "start": 5736, - "end": 5982, + "end": 5981, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5399181166837258, "protein": "MQPLHIAAIVGLIVAAIIAIVVWTIVLIEYRKILRQKRIDRLIDRIRERAEDSGNESEGDQEELSALMEMGHHAPGDVDDL", @@ -4643,9 +4643,9 @@ { "name": "env", "start": 5899, - "end": 8440, + "end": 8439, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4583799776107468, "protein": "MRVKGIRKNCQRLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEANTTLFCASDAKAYTPEAHNVWATHACVPTDPNPQEVGLENVTENFNMWKNNMVEQMHEDVINLWDQSLKPCVKLTPLCVTLNCTNLNVTNTNSSSEEGKMAEEMRNCSFNITTKIRNKMQKEYALFYKLDVVPIDNDNTSYTLINCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCKDKKFNGSGPCKNVSTVQCTHGIKPVVSTQLLLNGSLAEEEVVIRSENFTNNAKTIIVHLKEPIQINCTRPNNNTMKSIPLGPGRAFYATGAIIGDIRQAHCNLSRKAWNNTLKQVVEKLKEQYENKTIIFNHSSGGDPEIIMHTFNCGGEFFYCNTTQLFNSTWNSTWTGNATELDGNITLPCRIKQIINRWQEVGKAMYAPPIRGKIRCSSNITGLLLVRDGGNTSETETFRPGGGDMKDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLQDQQRLGIWGCSGKLICTTAVPWNASWSNKSLNQIWDNMTWMEWEREINNYTDTIYTLIEKAQNQQEKNEQELLELDKWASLWNWFNITKWLWYIKLFIMIVGGLIGLRIVFAVLAIVNRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSVRLVNGFLALFWDDLRSLCLFLCHRLRDLLLIVTRIVELLGRRGWEILKHWWSLLQYWIQELKSSAISLFNVTAIAVAEGTDRVIEVVQRACRALLHIPTRIRQGLERALL", @@ -4655,9 +4655,9 @@ { "name": "tat_exon2", "start": 8021, - "end": 8117, + "end": 8116, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.32608695652173914, "protein": "RPTSQPRGDPTGPKESKKKVEKETETDQFD", @@ -4667,9 +4667,9 @@ { "name": "rev_exon2", "start": 8022, - "end": 8298, + "end": 8297, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSPEGTRQARRNRRRRWRKRQRQISSISERILGTFLGRPAEPVPLPLPPLERLTLDCNKDCGTSGTQGVGNPQTLVESPAVLDSGAKE", @@ -4679,9 +4679,9 @@ { "name": "nef", "start": 8441, - "end": 9056, + "end": 9055, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4624277456647399, "protein": "MGGKWSKSSGGGWPAVRERMRRTEPAAEGVGAVSRDLERHGAVTSSNTAATNADCAWLEAQEEDSEVGFPVRPQVPLRPMTFKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVYNTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPEEANQGENNCLLHPTSLHGMEDPEKEVLMWKFDSRLAFHHMAREKHPEYYKDC", @@ -4693,9 +4693,9 @@ { "name": "gag", "start": 825, - "end": 2361, + "end": 2360, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.2559303794507086, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPSLLETAEGCRQILGQLQPSLQTGSEELKSLYNTLATLYCVHQRIEVKDTKEALEKIEEEQNKSKKKAQQAAADTGNSSQVRHTGNSSQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTSNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSHVTNSSAIMMQRGNFRNQRKAVKCFNCGKEGHIAKNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPPEEIFRFVEETTTPSQKQEPIDKELYPPLASLKSLFGNDPSSQ", @@ -4705,9 +4705,9 @@ { "name": "pol", "start": 2147, - "end": 5165, + "end": 5164, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.19193360134872262, "protein": "FFRENLAFPQRKAREFSPEQTRANSPTTRRDLQVCGRDNNSLSETGANRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGRWKPKMIGGIGGFIKVRQYDQIPIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPYRTRNPEMVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPNKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGEGQWTFQIYQEPFKNLKTGKYARARGAHTNDVKQLTEAVQKIATEGIVIWGKIPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKKGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAIHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQIIKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4717,9 +4717,9 @@ { "name": "vif", "start": 5109, - "end": 5688, + "end": 5687, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.24677296886864086, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHMYVSRKAKGWFYRHHFESNHPKISSEVHIPLEDARLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPDLADQLIHLYYFDCFSESAIRNAILGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKRKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -4729,9 +4729,9 @@ { "name": "vpr", "start": 5627, - "end": 5918, + "end": 5917, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.2608047690014903, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHSLGQYIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRARNGASRS", @@ -4741,21 +4741,21 @@ { "name": "tat_exon1", "start": 5898, - "end": 6117, + "end": 6113, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.40192926045016075, "protein": "MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGGCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCACTTGTTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPRTACTTCYCKKCCFHCQVCFTTKGLGISYGRKKRRQRRRAPQDSQTDQGPLPKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGGCTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTGCTTGTACCACTTGTTATTGTAAAAAATGCTGCTTTCATTGCCAAGTTTGTTTCACAACAAAAGGCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGACGAGCTCCTCAAGACAGTCAGACTGATCAAGGTCCTCTACCAAAGCAG" }, { "name": "rev_exon1", "start": 6037, - "end": 6118, + "end": 6117, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDDELLKTVRLIKVLYQSSK", @@ -4765,9 +4765,9 @@ { "name": "vpu", "start": 6129, - "end": 6375, + "end": 6374, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5077548005908421, "protein": "MQPLTILAIVALVVAAILAIVVWSIVLIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSALVERGHLAPWNVDDL", @@ -4777,9 +4777,9 @@ { "name": "env", "start": 6292, - "end": 8875, + "end": 8874, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.48559709145147756, "protein": "MKVRGIRKNYQHWWRGGILLLGMLMICNATEQQLWVTVYYGVPVWKEANTTLFCASDAKAYSTEVHNVWATHACVPTDPNPQEVVLKNVTENFNMWENNMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNTTRSSGNTTNEMKNCSFYTETDIRDKKRKEYALFYELDIVPIDEDNKNKSNNISYSRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEDEVVIKSSNFTNNAKTIIVQLNETVKINCTRPNNNTRKSIPIGPGRAFYATGDIIGDIRQAHCNISRANWTNTLKQIAEKLGKQFEENKTIVFNPSSGGDPEVVMHSFNCRGEFFYCNSTPLFNSTWKETNGIWTRIGESNDSATITLNDSDTITLQCKIRQIINLWQEVGKAMYAPPIKGQISCLSNITGLLLVRDGGNNTNGTEIFRPVGGEMRDNWRSELYKYKVVKIEPLGVAPTRAKRRVVQREKRATLGALFLGFLGAAGSTMGAASVTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLRDQQLLGIWGCSGKLICTTTVPWNTSWSNKSLEKIWNNMTWMEWEREIDNYTSLIYTLLEESQNQQEKNEKELLELDTWASLWNWFDITNWLWYIKIFIMIIGGLVGLRIVFTVLSIVNRVRQGYSPLSFQIHPPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLALFWVDLRSLCLFSYHRLRDLLLIVARIVELLGRRGWEALKYGWSLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEILQRACRAILHIPTRIRQGLERALL", @@ -4789,9 +4789,9 @@ { "name": "tat_exon2", "start": 8456, - "end": 8552, + "end": 8551, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.5303030303030303, "protein": "RSTPQLRGDPTGPKESKEKVERETETDPVH", @@ -4801,9 +4801,9 @@ { "name": "rev_exon2", "start": 8457, - "end": 8733, + "end": 8732, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.3690449563855961, "protein": "DPPPSSEGTRQARRNRRRRWRERQRQIRSISERILSTFLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGSSQIRVESPTILEPGTKE", @@ -4813,9 +4813,9 @@ { "name": "nef", "start": 8876, - "end": 9509, + "end": 9508, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.411658382286489, "protein": "MGGKWSKSKLFGWPAVRERMRRAEPAAEPAADGVGAASRDLERHGAITSSNTPTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSPKRQEILDLWVYHTQGFFPDWDNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNCLLHPMSQHGMEDPEREVLEWRFDSRLAFRHVARELHPEYYKDC", @@ -4827,9 +4827,9 @@ { "name": "gag", "start": 801, - "end": 2313, + "end": 2312, "subtype_start": 140, - "subtype_end": 1643, + "subtype_end": 1642, "orientation": "forward", "distance": 0.2589641434262949, "protein": "MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKTQQAAADTGNNSQTSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNFRNQRKNVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPVDKELYPLASLRSLFGNDPSSQ", @@ -4839,9 +4839,9 @@ { "name": "pol", "start": 2105, - "end": 5117, + "end": 5116, "subtype_start": 1435, - "subtype_end": 4447, + "subtype_end": 4446, "orientation": "forward", "distance": 0.14797358397500882, "protein": "FFRENLAFPQGEAREFSSEQTRANSPTRRELQVWGGDNNSLSEAGAGRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVTTIHTDNGSNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4851,9 +4851,9 @@ { "name": "vif", "start": 5061, - "end": 5640, + "end": 5639, "subtype_start": 4391, - "subtype_end": 4970, + "subtype_end": 4969, "orientation": "forward", "distance": 0.32379004771642805, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSIHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKERYSTQVDPGLADQLIHRYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -4863,9 +4863,9 @@ { "name": "vpr", "start": 5579, - "end": 5870, + "end": 5869, "subtype_start": 4909, - "subtype_end": 5200, + "subtype_end": 5199, "orientation": "forward", "distance": 0.34013605442176864, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAITRILQQLLFIHFRIGCQHSRIGIIQRRRARNGTSRS", @@ -4875,9 +4875,9 @@ { "name": "tat_exon1", "start": 5850, - "end": 6069, + "end": 6068, "subtype_start": 5180, - "subtype_end": 5399, + "subtype_end": 5398, "orientation": "forward", "distance": 0.38728632478632474, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ", @@ -4887,9 +4887,9 @@ { "name": "rev_exon1", "start": 5989, - "end": 6070, + "end": 6069, "subtype_start": 5319, - "subtype_end": 5397, + "subtype_end": 5396, "orientation": "forward", "distance": 0.3620426829268293, "protein": "MAGRSGDSDEELIKTVRLIKLLYQSSK", @@ -4899,9 +4899,9 @@ { "name": "vpu", "start": 6081, - "end": 6330, + "end": 6329, "subtype_start": 5411, - "subtype_end": 5657, + "subtype_end": 5656, "orientation": "forward", "distance": 0.44033465433729635, "protein": "MQPLEISAIVALVVAIIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL", @@ -4911,9 +4911,9 @@ { "name": "env", "start": 6244, - "end": 8827, + "end": 8826, "subtype_start": 5574, - "subtype_end": 8124, + "subtype_end": 8123, "orientation": "forward", "distance": 0.44564023273792597, "protein": "MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFYASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNTTSTKNTTPSTTASSGERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKKFNGSGPCTNVSTIQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKTIIVHLKDSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSSWKDESNGTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLITRDGGKNNESNTTEIFRPEGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKTLEQIWDNMTWMQWEREIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHPPAPRGPDRPEGIGEEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLNIPRRIRQGLERALL", @@ -4923,9 +4923,9 @@ { "name": "tat_exon2", "start": 8408, - "end": 8504, + "end": 8503, "subtype_start": 7705, - "subtype_end": 7798, + "subtype_end": 7797, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPTPQPRGDPTGQKESEKKVERETETDPDH", @@ -4935,9 +4935,9 @@ { "name": "rev_exon2", "start": 8409, - "end": 8685, + "end": 8684, "subtype_start": 7706, - "subtype_end": 7982, + "subtype_end": 7981, "orientation": "forward", "distance": 0.3471418653089562, "protein": "DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE", @@ -4947,9 +4947,9 @@ { "name": "nef", "start": 8828, - "end": 9461, + "end": 9460, "subtype_start": 8125, - "subtype_end": 8752, + "subtype_end": 8751, "orientation": "forward", "distance": 0.33768732280275404, "protein": "MGGKWSKSSVVGWPAIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC", @@ -4961,9 +4961,9 @@ { "name": "gag", "start": 855, - "end": 2358, + "end": 2357, "subtype_start": 200, - "subtype_end": 1700, + "subtype_end": 1699, "orientation": "forward", "distance": 0.38383718162342295, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPSLQTGSEELKSLYNTVATLYCVHQQIDVKDTKEALDKIEEEQNKSKKKVQQAATDTGNNSQASQNYPIVQNLQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGAIMMQRGNFRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPAESFRFGEETTTPSQKQEPIDKELYPLASLRSLFGNDPSSQ", @@ -4973,9 +4973,9 @@ { "name": "pol", "start": 2150, - "end": 5162, + "end": 5161, "subtype_start": 1492, - "subtype_end": 4504, + "subtype_end": 4503, "orientation": "forward", "distance": 0.21863141758600757, "protein": "FFREDLAFPQGEAREFSSEQTRANSPTSRELQVRGGDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIDELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCRLLKGTKALTEVVPLTREAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQRETWDTWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -4985,9 +4985,9 @@ { "name": "vif", "start": 5106, - "end": 5685, + "end": 5684, "subtype_start": 4448, - "subtype_end": 5027, + "subtype_end": 5026, "orientation": "forward", "distance": 0.3589413907639558, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISKKAKGWIYKHHYDSINPKISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPGLADRLIHLYYFDCFSESAIRNAILGRIVSPSCDYQAGHNKVGSLQYLALTALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -4997,9 +4997,9 @@ { "name": "vpr", "start": 5624, - "end": 5915, + "end": 5914, "subtype_start": 4966, - "subtype_end": 5257, + "subtype_end": 5256, "orientation": "forward", "distance": 0.2400808693454637, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCQHSRIGILQRRRARNGASRS", @@ -5009,9 +5009,9 @@ { "name": "tat_exon1", "start": 5895, - "end": 6114, + "end": 6113, "subtype_start": 5237, - "subtype_end": 5456, + "subtype_end": 5455, "orientation": "forward", "distance": 0.2515090543259557, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAHQDSQTHQASLSKQ", @@ -5021,9 +5021,9 @@ { "name": "rev_exon1", "start": 6034, - "end": 6115, + "end": 6114, "subtype_start": 5376, - "subtype_end": 5454, + "subtype_end": 5453, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEELIKTVRLIKLLYQSSK", @@ -5033,9 +5033,9 @@ { "name": "vpu", "start": 6126, - "end": 6375, + "end": 6374, "subtype_start": 5468, - "subtype_end": 5708, + "subtype_end": 5707, "orientation": "forward", "distance": 0.3726554787759131, "protein": "MQPLVISAIVALVVVAIIAIVVWSIVLIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVNDL", @@ -5045,9 +5045,9 @@ { "name": "env", "start": 6289, - "end": 8881, + "end": 8880, "subtype_start": 5631, - "subtype_end": 8208, + "subtype_end": 8207, "orientation": "forward", "distance": 0.48107374453325313, "protein": "MRARGIRKNYQHLLWRWGTMLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTGANNTTSTNTTTPSTTVSSEERMGEGEIKNCSFNITTSLRDKMQKEYALFYRPDIVPIDNTSYRLISCNTSVITQACPKVTFEPIPIHYCAPAGFAILKCNNKTFNGSGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEIVIRSENFSDNAKNIIVHLNKSVEITCIRPNNNTRKSIPMGPGKAFFATGAIIGDIRQAHCKINKTKWNNTLEQVFKKLREQFGNNKTIIFNHSSGGDPEIVTHNFNCGGEFFYCNTSKLFNSTWNETSYWKGEGSNNDTITLPCRIKQIINLWQEVGKAMYAPPIRGLIKCSSNITGLLLTRDGGNESETTDTETFRPVGGNMKDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGLGAMFLGFLGAAGSTMGAASITLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKNLTQIWDNMTWMQWEKEIDNYTSLIYTLIEESQNQQEKNELELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEGEGGERDRDRSGPLVNGFLAIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRGGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL", @@ -5057,9 +5057,9 @@ { "name": "tat_exon2", "start": 8462, - "end": 8558, + "end": 8557, "subtype_start": 7789, - "subtype_end": 7885, + "subtype_end": 7884, "orientation": "forward", "distance": 0.5337214944201844, "protein": "RPTSQPRGDPTGQKESKEKVERETETDPDH", @@ -5069,9 +5069,9 @@ { "name": "rev_exon2", "start": 8463, - "end": 8739, + "end": 8738, "subtype_start": 7790, - "subtype_end": 8066, + "subtype_end": 8065, "orientation": "forward", "distance": 0.41220115416323155, "protein": "DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILSNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTRGVGTPQVLVESPAVLESGTKE", @@ -5081,9 +5081,9 @@ { "name": "nef", "start": 8882, - "end": 9515, + "end": 9514, "subtype_start": 8209, - "subtype_end": 8842, + "subtype_end": 8841, "orientation": "forward", "distance": 0.3463855421686747, "protein": "MGGKWSKSSVVGWPKIRERMRRAEPAAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEEEEVGFPVRPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIYSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC", @@ -5095,9 +5095,9 @@ { "name": "gag", "start": 767, - "end": 2270, + "end": 2269, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.316486214000789, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKKYQLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEELKSLFHTVATLYCVHQKIEVKDTKEALEKIEEEQKKSKKKAQQAAADTGNNSQVSQNYPIVQNMQGQMVHQPLSPRTLNAWVKVIEDKAFSPEVIPMFTALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQLREPRGSDIAGTTSNLQEQIAWMTHNPPVPVGEIYKRWILLGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQASQDVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQVANPASIMMQRGNFRNQRKPIKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKVWPSRKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKPEPIDKELYPLASLRSLFGNDPSSQ", @@ -5107,9 +5107,9 @@ { "name": "pol", "start": 2062, - "end": 5074, + "end": 5073, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.1943357603710517, "protein": "FFREGLAFPQGEAREFPSEQTRANSPTRRELQVWGRDDNSLSETGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMNLPGKWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPRVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPIFAIKKKDGNKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRAKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPILLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPSKDLIAELQKQGQGQWTYQIYQEPYKNLKTGKYARMRGTHTNDIKQLTEAVQKIATESIVIWGKTPKFKLPIQKETWEAWWIEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTDKGRQKVVPLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLKGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSNVVKAACWWAGIKQEFGIPYNPQSQEVIESMNKELKKIIGQVRDQAEHLKTAVQMAVFVHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -5119,9 +5119,9 @@ { "name": "vif", "start": 5018, - "end": 5597, + "end": 5596, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMHISRKAKNWLYRHHYESIHPRISSEVHIPLGDARLVITTYWGLLTGERDWHLGQGVSIEWRERRYRTQVDPDLADQLIHLYYFDCFSESAIRNALLGRVVSPRCEYQAGHNQVGSLQYLALTALITPKRRKPPLPSVRKLTEDRWNKPQKTKGHKGSHTMNGH", @@ -5131,9 +5131,9 @@ { "name": "vpr", "start": 5536, - "end": 5827, + "end": 5826, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.2608047690014903, "protein": "MEQAPEDQGPQREPYNEWALELLEELKSEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGINLQRRARNGSSRS", @@ -5143,9 +5143,9 @@ { "name": "tat_exon1", "start": 5807, - "end": 6026, + "end": 6025, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.37688442211055273, "protein": "MDPVDPSLEPWKHPGSQPKTACTNCYCKKCCFHCQVCFIKKGLGISYGRKKRRQRRRASQGSETHQVSLPKQ", @@ -5155,21 +5155,21 @@ { "name": "rev_exon1", "start": 5946, - "end": 6027, + "end": 6023, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLKAVRLIKFLYQSSK", - "aminoacids": "MAGRSGDSDEELLKAVRLIKFLYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLKAVRLIKFLYQSS", + "aminoacids": "MAGRSGDSDEELLKAVRLIKFLYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGGCAGTGAGACTCATCAAGTTTCTCTACCAAAGCAGT" }, { "name": "vpu", "start": 6038, - "end": 6284, + "end": 6283, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5464940306036659, "protein": "MRPLEIAAIVALVVAVLIAIVVWSIVLIEYRKILRQRKIDRIVDRIRERAEDSGNESEGDQEELSALVERGHLAPWDIDDL", @@ -5179,9 +5179,9 @@ { "name": "env", "start": 6201, - "end": 8778, + "end": 8777, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5083167934238491, "protein": "MRVKGIRRNYQHWWRGGTLLLGILMICSATENLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPSPQEVVLKNVTEKFNMWKNNMVEQMHQDIISLWDESLKPCVKLTPLCVTLNCTNATISGNATEEIKNCSFNVNTKIGGKKQKERALFYKLDVVPIDDDSTNRTNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCGDKEFNGTGLCRNVSTVQCTHGIRPVVSTQLLLNGSLAEGEVVIKSENITNNVKTIIVQLNETVSINCTRPSNNTRRSIHMGPGRAFYATGEIIGDIRKAQCILNKTDWSDTLTRIAKKLHKQFHGPIAFEQSSGGDPEITMHTFNCGGEFFYCNTSALFSGTWNGTAWTNATWGNIAGNNITLQCRIKQFINRWQEVGKAMYAPPIRGEIRCSSNITGLLLTRDGGSNTTNGGENGTQIGENVTQIFRPGGGDMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVTFGALFLGFLGAAGSTMGAASMTLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLRDQQLLGIWGCSGKLICTTTVPWNASWSNKTLEKIWGNMTWMEWEREIDNYTDLIYTLIEQSQNQQEKNEQELLELDKWAGLWNWFDITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRLPASRGPDRPEGTDEEGGERDRDRSGSLVNGFLALIWIDLRSLFLFSYLRLRDLLLIAARIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNAIAISVAEGTDRIIEAIQRICRAILHIPTRIRQGLERALL", @@ -5191,9 +5191,9 @@ { "name": "tat_exon2", "start": 8359, - "end": 8455, + "end": 8454, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4034761018001243, "protein": "RPASQPRGDPTGPKEPTKKVERETETDPDH", @@ -5203,9 +5203,9 @@ { "name": "rev_exon2", "start": 8360, - "end": 8636, + "end": 8635, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.38952607660679506, "protein": "DPPPSLEGTRQARRNRRRRWRERQRQIRIISERILSTHLDRPAESVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKE", @@ -5215,9 +5215,9 @@ { "name": "nef", "start": 8779, - "end": 9406, + "end": 9405, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.5049429657794677, "protein": "MGGKGSKMRGWVAVREKMRRTKPEDEPAANGVGAASRDLEKYGALTSSNTVATNADLAWLEAQEEEEVGFPVRPQVPLRPMTYKGALDLSHFLKEKGGLEGLIYSQKRQDILDLWVHHTQGYLPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDQVEEANAGENNSLLHPMSLHGIEDPEKEVLMWKFDSHLAFRHMARELHPEYYKDC", @@ -5229,9 +5229,9 @@ { "name": "gag", "start": 773, - "end": 2276, + "end": 2275, "subtype_start": 200, - "subtype_end": 1700, + "subtype_end": 1699, "orientation": "forward", "distance": 0.3910844507174782, "protein": "MGARASVLSGGELDRWERIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSKGCRQILEQLQPALQTGSEELKSLYNTVATLYCVHQKIDVKDTKEALDKIEEEQNKSKKKAQQAAADTGNNSQASQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQCTQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTTPGTIMMQRGNLRSQRKTVKCFNCGKEGHIAKNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQEPIDKEMYPLASLRSLFGNDPSSQ", @@ -5241,9 +5241,9 @@ { "name": "pol", "start": 2068, - "end": 5080, + "end": 5079, "subtype_start": 1492, - "subtype_end": 4504, + "subtype_end": 4503, "orientation": "forward", "distance": 0.21863141758600757, "protein": "FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQRNVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMTLPGRWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVKQLCKLLRGTKALTEVIPLTREAELELAENREILKEPVHGVYYDPTKDLIVEIQKQGQGQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFRLPIQRETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLIKKDKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIDKAQDDHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGGNFISTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVYIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKLQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -5253,9 +5253,9 @@ { "name": "vif", "start": 5024, - "end": 5603, + "end": 5602, "subtype_start": 4448, - "subtype_end": 5027, + "subtype_end": 5026, "orientation": "forward", "distance": 0.3264662839130924, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYISRKAKGWVYKHHYDSTHPRISSEVHIPLGDAKLVITTYWGLHTGERDWHLGQGVSIEWRKKRYSTQVDPGLADQLIHLYYFDCFSESAIRNAILGHIVSPSCDYQAGHNKVGSLQYLALAALITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -5265,9 +5265,9 @@ { "name": "vpr", "start": 5542, - "end": 5833, + "end": 5832, "subtype_start": 4966, - "subtype_end": 5257, + "subtype_end": 5256, "orientation": "forward", "distance": 0.2678354029705382, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKNEAVRHFPRPWLHSLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGIIQRRRARNGASRS", @@ -5277,9 +5277,9 @@ { "name": "tat_exon1", "start": 5813, - "end": 6032, + "end": 6031, "subtype_start": 5237, - "subtype_end": 5456, + "subtype_end": 5455, "orientation": "forward", "distance": 0.2515090543259557, "protein": "MEPVDPRLEPWKHPGSQPRTACTSCYCKQCCFHCQVCFITKGLGISYGRKKRRQRRRAPPDSQTHQASLSKQ", @@ -5289,21 +5289,21 @@ { "name": "rev_exon1", "start": 5952, - "end": 6033, + "end": 6029, "subtype_start": 5376, - "subtype_end": 5454, + "subtype_end": 5453, "orientation": "forward", - "distance": 0.4807692307692307, - "protein": "MAGRSGDSDEELLQTVRLIKLLYQSSK", - "aminoacids": "MAGRSGDSDEELLQTVRLIKLLYQSSK", - "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCCAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGTAAG" + "distance": 0.4267425320056898, + "protein": "MAGRSGDSDEELLQTVRLIKLLYQSS", + "aminoacids": "MAGRSGDSDEELLQTVRLIKLLYQSS", + "nucleotides": "ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCCAGACAGTCAGACTCATCAAGCTTCTCTATCAAAGCAGT" }, { "name": "vpu", "start": 6044, - "end": 6290, + "end": 6289, "subtype_start": 5468, - "subtype_end": 5708, + "subtype_end": 5707, "orientation": "forward", "distance": 0.4384802297327147, "protein": "MQPLHIAAIVALVVAIIIAIVVWSIVFIEYRKILRQRKIDRIIDRIRERAEDSGNESEGDQEELSALVEMGHCAPWDVNDL", @@ -5313,9 +5313,9 @@ { "name": "env", "start": 6207, - "end": 8790, + "end": 8789, "subtype_start": 5631, - "subtype_end": 8208, + "subtype_end": 8207, "orientation": "forward", "distance": 0.4684887834843129, "protein": "MRVRGIKKNYQHLWRWGIVLLGMLMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDTEVHNVWATHACVPTDPNPQEVVLGNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTNYNNTNNTTSTNDTTSTTTSSGEKMKEGEIKNCSFNITTSIRDKVQKEYALFYKPDIVPIDNDNTSYRLISCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNDKKFNGTGSCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSENFSDNAKTIIVHLNESVEITCIRPNNNTRKSIPIGPGRAFYATGAIIGDIRQAHCKINKTKWNNTLDQIFKKLREQFGNKTIIFTHSSGGDPEVVTHNFNCGGEFFYCNTTKLFNSTWNETSYWKDERSNDNDTITLPCRIKQIINLWQEVGKAMYAPPIRGYIKCSSNITGLLITRDGGKNESNTTETFRPGGGNMRDNWRSELYKYKVVKIEPLGIAPTKAKRRVVQREKRAVGIGAVFLGFLGAAGSTMGAASITLTVQARLLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARVLAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWDNMTWMEWEREIDNYTSLIYTLIEKSQNQQEKNEQELLELDKWASLWNWFDITKWLWYIKIFIMIVGGLVGLRIVFAVLSIANRVRQGYSPLSFQTHLPAPRGPDRPEGIEEEGGERDRDRSGPLVNGFLTIIWVDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWELLKYWWNLLQYWSQELKNSAISLLNATAIAVAEGTDRIIEVLQRAGRAFLHIPRRIRQGLERALL", @@ -5325,9 +5325,9 @@ { "name": "tat_exon2", "start": 8371, - "end": 8467, + "end": 8466, "subtype_start": 7789, - "subtype_end": 7885, + "subtype_end": 7884, "orientation": "forward", "distance": 0.4971219256933542, "protein": "RPTSQPRGDPTGQKESKKKVERETETDPDH", @@ -5337,9 +5337,9 @@ { "name": "rev_exon2", "start": 8372, - "end": 8648, + "end": 8647, "subtype_start": 7790, - "subtype_end": 8066, + "subtype_end": 8065, "orientation": "forward", "distance": 0.3934495959166312, "protein": "DPPPSPEGTRQARRNRRRRWRERQRQIRTISERILNNYLGRPAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGTPQILVESPAVLESGTKE", @@ -5349,9 +5349,9 @@ { "name": "nef", "start": 8791, - "end": 9412, + "end": 9411, "subtype_start": 8209, - "subtype_end": 8842, + "subtype_end": 8841, "orientation": "forward", "distance": 0.36363636363636354, "protein": "MGGKWSKSSVVGWPAIRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNADCAWLEAQEDEEVGFPVRPQVPLRPMTYKGAVDLSHFLKEKGGLEGLIHSQKRQDILDLWVYHTQGYFPDWQNYTPGPGIRYPLTFGWCFKLVPVEPDKVEEANEGENNSLLHPMSLHGMDDPEKEVLVWRFDSRLAFHHMARELHPEYYKDC", @@ -5363,9 +5363,9 @@ { "name": "gag", "start": 808, - "end": 2308, + "end": 2307, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.2880084183556755, "protein": "MGARASVLSGGELDKWEKIRLRPGGKKQYKLKHLVWASRELERFAVNPGLLETSEGCRQILGQLQPALQTGSEEFRSLYNTVATLYCVHQKIEVKDTKEALEKIEEEQNQSKKKAAAAAADTGNRSQVSQNYPIVQNLQGQMVHQPLSPRTLNAWVKVIEEKAFSPEVIPMFTALSEGATPQDLNTMLNTIGGHQAAMQMLKETINEEAAEWDRLHPVQAGPVAPGQMREPRGSDIAGTTSNLQEQIGWMTHNPPIPVGDIYKRWIILGLNKIVRMYSPVSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSTVMMQRGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSKPEPTAPPEESFRFGEETTTPSQKQGPIDKELYPLASLKSLFGNDPSSQ", @@ -5375,9 +5375,9 @@ { "name": "pol", "start": 2100, - "end": 5112, + "end": 5111, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.1880239208210378, "protein": "FFREDLAFPQGEAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEDMNLPGKWKPKMIGGIGGFIKVRQYDQILVEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSIPLDKDFRKYTAFTIPSTNNETPGIRYQYNVLPQGWKGSPAIFQSSMTRILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLKWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIKLPEKDSWTVNDIQKLVGKLNWASQIYAGIKVRQLCKLLRGTKALTEVVPLTAEAELELAENREILKEPVHGVYYDPTKDLIAELQKQGQSQWTYQIYQEPFKNLKTGKYARMRGAHTNDVKQLTEAVQKIAIESIVIWGKTPKFKLPIQKETWETWWTDYWQATWIPDWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETRSGKAGYVTDRGRQKVVPLTDTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSSGIRKILFLDGITKAQDDHERYHSNWRAMASDFNLPPIIAKEIVASCDKCQLKGEATHGQVDCSPGIWQLDCTHLEGKIILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTVHTDNGSNFTSAAVKAACWWAGIKQEFGIPYNPQSQGVIESMNKELKKIIGQVREQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIIDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -5387,9 +5387,9 @@ { "name": "vif", "start": 5056, - "end": 5635, + "end": 5634, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.41532297468972923, "protein": "MENRWQVMIVWQVDRMRIRTWNSLVKHHIHVSKKAKGWVYRHHYESTHPRISSEVHIPLGEARLVIATYWGLHTGERDWHLGQGVSIEWREKKYITQVDPDLADQLIHLHYFDCFSESAIRNAIVGRLVSPQCEYQTGHNKVGSLQYLALVALITPKKRKPPLPSVRKLTEDRWNKPQKTKDHRGSHIMSGH", @@ -5399,9 +5399,9 @@ { "name": "vpr", "start": 5574, - "end": 5865, + "end": 5864, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3120665742024965, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKSEAVRHFPRIWLHNLGQYIYATYGDTWTGVEALIRILQQLLFIHFRIGCQHSRIGITRQRRARNGASRS", @@ -5411,9 +5411,9 @@ { "name": "tat_exon1", "start": 5845, - "end": 6064, + "end": 6063, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTPCTNCYCKKCCFHCQVCFIKKALGISYGRKKRRQRRRPPQNSETHQAALSKQ", @@ -5423,9 +5423,9 @@ { "name": "rev_exon1", "start": 5984, - "end": 6065, + "end": 6064, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEDLLKTVRLIKQLYQSSK", @@ -5435,9 +5435,9 @@ { "name": "vpu", "start": 6076, - "end": 6340, + "end": 6339, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.4955621301775147, "protein": "MQPLVILAIVALVVAAIIAIVVWTIVLIEYRKILRQRKIDSIINRIRERAEDSGNESEGDQEELSALVEMGHHVEMGHHAPWNVDDL", @@ -5447,9 +5447,9 @@ { "name": "env", "start": 6239, - "end": 8807, + "end": 8806, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4703403690377699, "protein": "MRVKEIRKNCRHLWRWGTMWKWGTMLLGMLMICSAKEQLWVTVYYGVPVWKEATTTLFCASNAKAYDPEVHNVWATHACVPTDPNPQEVPLENVTENFNMWKNNMVEQMHEDIISLWDQSLKPCVKLTPLCVILNCTNVNVTTNNNSSSEEQMEVGEIKNCSFNIATRIKNKIKKEYALFNRLDVVPIEDDNTSYMLINCNTSVTTQACPKVTFEPIPIHYCAPAGFAILKCNDKKFNGTGPCNNVSTVQCTHGIKPVVSTQLLLNGSLAEEEIVVRSENFTNNAKTIIVQLNKTIEINCIRPNNNTRKSISLRPGQAIYATEDIIGNIRQAHCNIRRKDWDKALEQVVAKLREQFKNKTIVFNQSSGGDPEIVMHSFNCAGEFFYCNTTKLFNSTWNVNNTRNNTTDNSTITLPCRIKQIINRWQEVGKAMYAPPIKGQIKCSSNITGLLLTRDGGVREDNAPEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQRGKRAVTLGAMFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLAVERYLQDQQLLGIWGCSGKLICTTAVPWNTSWSNKSLEKIWKNMTWMEWEKEINNYTRTIYTLIEESQNQQEKNEQELLELDKWASLWNWFDITNWLWYIKIFIMIVGGIVGLRIVFTVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGTEEEGGERDRDRSGQLVNGFFALIWDDLQSLCLFSYRRLRDLLLIVARIVELLGHRGWEALKYWWNLLQYWSQELKKSAVSLLNATAIAVAEGTDRVIEVVQRIGRAILHIPRRIRQGLERALL", @@ -5459,9 +5459,9 @@ { "name": "tat_exon2", "start": 8388, - "end": 8484, + "end": 8483, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.4918032786885247, "protein": "RPASQLRGDQTGPKEQKKKVERETETDPGN", @@ -5471,9 +5471,9 @@ { "name": "rev_exon2", "start": 8389, - "end": 8674, + "end": 8673, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.4123815285339786, "protein": "DPLPSSEGTRQARRNRRRRWRERQRQIRAISERILCAYLGRPAEPVPLQLPPLERLTLDCSEDCGTSGTQGVGGPQILVESPAVLESGTKEECC", @@ -5483,9 +5483,9 @@ { "name": "nef", "start": 8808, - "end": 9417, + "end": 9416, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.484764542936288, "protein": "MGGKWSKCSLVGWPAIRERMRRAEPAPAAEGVGAASRDLEKHGALTTSNTAANNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKGAMDLGHFLKEKGGLEGLIYSPKRQEILDLWVYHTQGYFPDWQNYTPGPGTRYPLTFGWCFKLVPVEPDEGENSCLLHPMNQHGADDTEREVLMWKFDSSLAFHHKARELHPEYYKNC", diff --git a/tests/expected-results-single-csv/holistic.csv b/tests/expected-results-single-csv/holistic.csv index 57ad129..b317787 100644 --- a/tests/expected-results-single-csv/holistic.csv +++ b/tests/expected-results-single-csv/holistic.csv @@ -1,2 +1,2 @@ seqid,qlen,hypermutation_probablility,inferred_subtype,blast_matched_qlen,blast_sseq_coverage,blast_qseq_coverage,blast_sseq_orfs_coverage,orfs_start,orfs_end,blast_n_conseqs -MN692145,9689,0.1672411051048176,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.130479522535501,1.1271545051088863,1.0,789,8794,3 +MN692145,9689,0.1672411051048176,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.130479522535501,1.1271545051088863,1.0,789,8793,3 diff --git a/tests/expected-results-single-csv/orfs.csv b/tests/expected-results-single-csv/orfs.csv index 5c8fb54..cf06ef8 100644 --- a/tests/expected-results-single-csv/orfs.csv +++ b/tests/expected-results-single-csv/orfs.csv @@ -1,12 +1,12 @@ seqid,name,start,end,subtype_start,subtype_end,orientation,distance,protein,aminoacids,nucleotides -MN692145,gag,775,2281,789,2292,forward,0.20784453738651432,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGAACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGGACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGATAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACACAGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAATGGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAAAACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA -MN692145,pol,2070,5085,2084,5096,forward,0.14843087362171337,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGGACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATACCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATCAAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACTGGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MN692145,vif,5029,5608,5040,5619,forward,0.2608047690014903,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTATGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGACCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCATATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCCTAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAG -MN692145,vpr,5547,5838,5558,5849,forward,0.3566796368352788,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG -MN692145,tat_exon1,5818,6037,5829,6045,forward,0.28735632183908044,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA -MN692145,rev_exon1,5957,6038,5968,6046,forward,0.4274965800273598,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG -MN692145,vpu,6049,6298,6060,6309,forward,0.520618556701031,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*,ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG -MN692145,env,6212,8783,6223,8794,forward,0.4766895145301081,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA -MN692145,tat_exon2,8364,8460,8375,8471,forward,0.3921568627450981,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -MN692145,rev_exon2,8365,8641,8376,8652,forward,0.29843322556577967,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG -MN692145,nef,8784,9387,8795,9416,forward,0.3966849799795139,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA +MN692145,gag,775,2280,789,2291,forward,0.20784453738651432,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGAACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGGACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGATAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACACAGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAATGGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAAAACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MN692145,pol,2070,5084,2084,5095,forward,0.14843087362171337,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGGACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATACCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATCAAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACTGGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN692145,vif,5029,5607,5040,5618,forward,0.2608047690014903,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTATGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGACCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCATATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCCTAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAG +MN692145,vpr,5547,5837,5558,5848,forward,0.3566796368352788,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG +MN692145,tat_exon1,5818,6036,5829,6044,forward,0.28735632183908044,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA +MN692145,rev_exon1,5957,6037,5968,6045,forward,0.4274965800273598,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN692145,vpu,6049,6297,6060,6308,forward,0.520618556701031,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*,ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG +MN692145,env,6212,8782,6223,8793,forward,0.4766895145301081,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA +MN692145,tat_exon2,8364,8459,8375,8470,forward,0.3921568627450981,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +MN692145,rev_exon2,8365,8640,8376,8651,forward,0.29843322556577967,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG +MN692145,nef,8784,9386,8795,9415,forward,0.3966849799795139,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA diff --git a/tests/expected-results-single-hxb2/holistic.json b/tests/expected-results-single-hxb2/holistic.json index 9a1c5bf..43acd43 100644 --- a/tests/expected-results-single-hxb2/holistic.json +++ b/tests/expected-results-single-hxb2/holistic.json @@ -8,7 +8,7 @@ "blast_qseq_coverage": 1.1271545051088863, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 } } \ No newline at end of file diff --git a/tests/expected-results-single-hxb2/orfs.json b/tests/expected-results-single-hxb2/orfs.json index 3c10e8a..285ff83 100644 --- a/tests/expected-results-single-hxb2/orfs.json +++ b/tests/expected-results-single-hxb2/orfs.json @@ -3,9 +3,9 @@ { "name": "gag", "start": 775, - "end": 2281, + "end": 2280, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.20784453738651432, "protein": "MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ", @@ -15,9 +15,9 @@ { "name": "pol", "start": 2070, - "end": 5085, + "end": 5084, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.14843087362171337, "protein": "FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED", @@ -27,9 +27,9 @@ { "name": "vif", "start": 5029, - "end": 5608, + "end": 5607, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.2608047690014903, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH", @@ -39,9 +39,9 @@ { "name": "vpr", "start": 5547, - "end": 5838, + "end": 5837, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS", @@ -51,9 +51,9 @@ { "name": "tat_exon1", "start": 5818, - "end": 6037, + "end": 6036, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ", @@ -63,9 +63,9 @@ { "name": "rev_exon1", "start": 5957, - "end": 6038, + "end": 6037, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4274965800273598, "protein": "MAGRSGDSDEELLKTVRLIKFLYQSSK", @@ -75,9 +75,9 @@ { "name": "vpu", "start": 6049, - "end": 6298, + "end": 6297, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.520618556701031, "protein": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL", @@ -87,9 +87,9 @@ { "name": "env", "start": 6212, - "end": 8783, + "end": 8782, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4766895145301081, "protein": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL", @@ -99,9 +99,9 @@ { "name": "tat_exon2", "start": 8364, - "end": 8460, + "end": 8459, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.3921568627450981, "protein": "RPASQPRGDPTGPKESKKKVERETETDPLH", @@ -111,9 +111,9 @@ { "name": "rev_exon2", "start": 8365, - "end": 8641, + "end": 8640, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.29843322556577967, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE", @@ -123,9 +123,9 @@ { "name": "nef", "start": 8784, - "end": 9387, + "end": 9386, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.3966849799795139, "protein": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC", diff --git a/tests/expected-results-single/holistic.json b/tests/expected-results-single/holistic.json index 9a1c5bf..43acd43 100644 --- a/tests/expected-results-single/holistic.json +++ b/tests/expected-results-single/holistic.json @@ -8,7 +8,7 @@ "blast_qseq_coverage": 1.1271545051088863, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 } } \ No newline at end of file diff --git a/tests/expected-results-single/orfs.json b/tests/expected-results-single/orfs.json index 3c10e8a..285ff83 100644 --- a/tests/expected-results-single/orfs.json +++ b/tests/expected-results-single/orfs.json @@ -3,9 +3,9 @@ { "name": "gag", "start": 775, - "end": 2281, + "end": 2280, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.20784453738651432, "protein": "MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ", @@ -15,9 +15,9 @@ { "name": "pol", "start": 2070, - "end": 5085, + "end": 5084, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.14843087362171337, "protein": "FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED", @@ -27,9 +27,9 @@ { "name": "vif", "start": 5029, - "end": 5608, + "end": 5607, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.2608047690014903, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH", @@ -39,9 +39,9 @@ { "name": "vpr", "start": 5547, - "end": 5838, + "end": 5837, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS", @@ -51,9 +51,9 @@ { "name": "tat_exon1", "start": 5818, - "end": 6037, + "end": 6036, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ", @@ -63,9 +63,9 @@ { "name": "rev_exon1", "start": 5957, - "end": 6038, + "end": 6037, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4274965800273598, "protein": "MAGRSGDSDEELLKTVRLIKFLYQSSK", @@ -75,9 +75,9 @@ { "name": "vpu", "start": 6049, - "end": 6298, + "end": 6297, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.520618556701031, "protein": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL", @@ -87,9 +87,9 @@ { "name": "env", "start": 6212, - "end": 8783, + "end": 8782, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4766895145301081, "protein": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL", @@ -99,9 +99,9 @@ { "name": "tat_exon2", "start": 8364, - "end": 8460, + "end": 8459, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.3921568627450981, "protein": "RPASQPRGDPTGPKESKKKVERETETDPLH", @@ -111,9 +111,9 @@ { "name": "rev_exon2", "start": 8365, - "end": 8641, + "end": 8640, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.29843322556577967, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE", @@ -123,9 +123,9 @@ { "name": "nef", "start": 8784, - "end": 9387, + "end": 9386, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.3966849799795139, "protein": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC", diff --git a/tests/expected-results-small-csv/errors.csv b/tests/expected-results-small-csv/errors.csv index 39f058b..8fe3ff6 100644 --- a/tests/expected-results-small-csv/errors.csv +++ b/tests/expected-results-small-csv/errors.csv @@ -1,32 +1,32 @@ sequence_name,error,message -KX505501.1,DeletionInOrf,"ORF pol at 2084-5096 can have maximum deletions 30, got 2721" -KX505501.1,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6322 -KX505501.1,InsertionInOrf,"Smaller ORF vif at 5040-5619 can have maximum insertions 90, got 909" -KX505501.1,DeletionInOrf,"Smaller ORF vpr at 5558-5849 can have maximum deletions 30, got 66" -KX505501.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892 -KX505501.1,InternalStopInOrf,Smaller ORF rev_exon1 at 5968-6046 contains an internal stop codon at 6004 -KX505501.1,FrameshiftInOrf,Smaller ORF vpu at 6060-6309 contains out of frame indels that impact 189 positions. -KX505501.1,FrameshiftInOrf,Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 51 positions. -KX505501.1,DeletionInOrf,"Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 96" -KX505501.1,InsertionInOrf,"Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 867" +KX505501.1,DeletionInOrf,"ORF pol at 2084-5095 can have maximum deletions 30, got 2721" +KX505501.1,InternalStopInOrf,ORF env at 6223-8793 contains an internal stop codon at 6322 +KX505501.1,InsertionInOrf,"Smaller ORF vif at 5040-5618 can have maximum insertions 90, got 909" +KX505501.1,DeletionInOrf,"Smaller ORF vpr at 5558-5848 can have maximum deletions 30, got 66" +KX505501.1,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5892 +KX505501.1,InternalStopInOrf,Smaller ORF rev_exon1 at 5968-6045 contains an internal stop codon at 6004 +KX505501.1,FrameshiftInOrf,Smaller ORF vpu at 6060-6308 contains out of frame indels that impact 190 positions. +KX505501.1,FrameshiftInOrf,Smaller ORF tat_exon2 at 8375-8470 contains out of frame indels that impact 51 positions. +KX505501.1,DeletionInOrf,"Smaller ORF rev_exon2 at 8376-8651 can have maximum deletions 30, got 96" +KX505501.1,InsertionInOrf,"Smaller ORF nef at 8795-9415 can have maximum insertions 90, got 867" KX505501.1,RevResponseElementDeletion,Query Sequence exceeds maximum deletion tolerance in RRE. Contains 265 deletions with max tolerance of 20 deletions. KX505501.1,LongDeletion,Query sequence contains a long deletion. KX505501.1,Scramble,Sequence is plus-scrambled. -MN691959,InternalStopInOrf,Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6123 -MN691959,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 -MN692074,DeletionInOrf,"ORF pol at 2084-5096 can have maximum deletions 30, got 981" -MN692074,InternalStopInOrf,ORF env at 6223-8794 contains an internal stop codon at 6550 -MN692074,DeletionInOrf,"Smaller ORF vif at 5040-5619 can have maximum deletions 30, got 81" -MN692074,InsertionInOrf,"Smaller ORF vpr at 5558-5849 can have maximum insertions 90, got 207" -MN692074,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892 -MN692074,InsertionInOrf,"Smaller ORF vpu at 6060-6309 can have maximum insertions 90, got 249" -MN692074,FrameshiftInOrf,Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 40 positions. -MN692074,DeletionInOrf,"Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 204" -MN692074,InsertionInOrf,"Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 882" +MN691959,InternalStopInOrf,Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6123 +MN691959,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420 +MN692074,DeletionInOrf,"ORF pol at 2084-5095 can have maximum deletions 30, got 981" +MN692074,InternalStopInOrf,ORF env at 6223-8793 contains an internal stop codon at 6550 +MN692074,DeletionInOrf,"Smaller ORF vif at 5040-5618 can have maximum deletions 30, got 81" +MN692074,InsertionInOrf,"Smaller ORF vpr at 5558-5848 can have maximum insertions 90, got 207" +MN692074,InternalStopInOrf,Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5892 +MN692074,InsertionInOrf,"Smaller ORF vpu at 6060-6308 can have maximum insertions 90, got 249" +MN692074,FrameshiftInOrf,Smaller ORF tat_exon2 at 8375-8470 contains out of frame indels that impact 40 positions. +MN692074,DeletionInOrf,"Smaller ORF rev_exon2 at 8376-8651 can have maximum deletions 30, got 204" +MN692074,InsertionInOrf,"Smaller ORF nef at 8795-9415 can have maximum insertions 90, got 882" MN692074,RevResponseElementDeletion,Query Sequence exceeds maximum deletion tolerance in RRE. Contains 265 deletions with max tolerance of 20 deletions. MN692074,LongDeletion,Query sequence contains a long deletion. -MN090335,InternalStopInOrf,ORF gag at 789-2292 contains an internal stop codon at 822 -MN090335,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420 +MN090335,InternalStopInOrf,ORF gag at 789-2291 contains an internal stop codon at 822 +MN090335,InternalStopInOrf,Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420 MN090335,PackagingSignalDeletion,Query Sequence exceeds maximum deletion tolerance in PSI. Contains 42 deletions with max tolerance of 10 deletions. MN090335,MajorSpliceDonorSiteMutated,"Query sequence has a mutated splice donor site, AT." MN090335,Scramble,Sequence is minus-scrambled. diff --git a/tests/expected-results-small-csv/holistic.csv b/tests/expected-results-small-csv/holistic.csv index 352edd3..c47d0e7 100644 --- a/tests/expected-results-small-csv/holistic.csv +++ b/tests/expected-results-small-csv/holistic.csv @@ -1,6 +1,6 @@ seqid,qlen,hypermutation_probablility,inferred_subtype,blast_matched_qlen,blast_sseq_coverage,blast_qseq_coverage,blast_sseq_orfs_coverage,orfs_start,orfs_end,blast_n_conseqs -KX505501.1,1997,0.7087072014754221,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,1997,0.2498456472525211,1.2158237356034052,0.17663960024984385,789,8794,4 -MN691959,9493,0.19667690182893238,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9493,1.0817040543321672,1.1086063415148004,1.0,789,8794,3 -MN692074,4178,0.36378645339477633,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,4178,0.5042189750977567,1.1728099569171853,0.4114928169893816,789,8794,4 -MN692145,9689,0.1672411051048176,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.130479522535501,1.1271545051088863,1.0,789,8794,3 -MN090335,9069,0.1771850809736527,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9069,0.9842560197571517,1.0603153600176425,1.0003747657713928,789,8794,3 +KX505501.1,1997,0.7087072014754221,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,1997,0.2498456472525211,1.2158237356034052,0.17666166916541728,789,8793,4 +MN691959,9493,0.19667690182893238,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9493,1.0817040543321672,1.1086063415148004,1.0,789,8793,3 +MN692074,4178,0.36378645339477633,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,4178,0.5042189750977567,1.1728099569171853,0.411544227886057,789,8793,4 +MN692145,9689,0.1672411051048176,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9689,1.130479522535501,1.1271545051088863,1.0,789,8793,3 +MN090335,9069,0.1771850809736527,Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455,9069,0.9842560197571517,1.0603153600176425,1.000374812593703,789,8793,3 diff --git a/tests/expected-results-small-csv/orfs.csv b/tests/expected-results-small-csv/orfs.csv index a5fce96..3b445d9 100644 --- a/tests/expected-results-small-csv/orfs.csv +++ b/tests/expected-results-small-csv/orfs.csv @@ -1,56 +1,56 @@ seqid,name,start,end,subtype_start,subtype_end,orientation,distance,protein,aminoacids,nucleotides -KX505501.1,env,0,1824,6223,8794,forward,0.7623480451210163,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,vif,0,1824,5040,5619,forward,0.7647696476964769,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,nef,0,1824,8795,9416,forward,0.764345579086969,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,tat_exon1,1,1750,5829,6045,forward,0.7680130480667754,MRKLQNGIDCIQCMQGLLHQAR,VSLVRPDLSLGALWLTREPTA*ASIKLALSASSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKGKPEELSRRRTRLAERAQQEARGGDW*VRRKFFD*RRLEGERWVRERQY*AGENWIDGKKFG*GQEEIKDIN*NI*YGQAES*NDSQLILAC*KHQKAVDKYWDSYNRLLRQDQKNLSLCIIQ*QSSIVYIKK*M*KTPRKP*TR*KKSKTKLGNKHSKPQLQEVAVRSATITL*CRIIRGKWYIRPCHQEL*MHG*K**RKRLSAQK*YPCFQHYQKEPPHKT*TPC*IQWGDIKQPCKC*KRPLMRKLQNGIDCIQCMQGLLHQAR*ENQGEVT*QELLVPFRNK*HG*QIIHLSQ*ERFIKDG*S*G*IK**ECIALSAFWT*DKDQRNLLETM*TGSIKP*EPNKPHRK*KIG*QKPCWSRMRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,GTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT -KX505501.1,gag,336,1824,789,2292,forward,0.3997973809613161,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,rev_exon1,1306,1750,5968,6046,forward,0.758082497212932,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,ATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT -KX505501.1,vpr,1599,1824,5558,5849,forward,0.763687959047407,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,vpu,1599,1824,6060,6309,forward,0.7672672672672673,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,pol,1627,1927,2084,5096,forward,0.7724330674761569,GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,IL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,ATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA -KX505501.1,tat_exon2,1746,1824,8375,8471,forward,0.7616257781032589,RCIRSTTRTADTELFTRDFPLGTFQ,RCIRSTTRTADTELFTRDFPLGTFQ*,AGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG -KX505501.1,rev_exon2,1747,1927,8376,8652,forward,0.7620186257236345,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA -MN691959,gag,639,2142,789,2292,forward,0.0801186943620179,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATCGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGAGAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGACACAGCAACCAGATCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAGTGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCYWYCTWTCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAAGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCWGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGAGTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA -MN691959,pol,1934,4946,2084,5096,forward,0.054722889368558514,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAGCTGAGACAACATCTGTTGAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAGAGCATTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGTATAGTAATATGGGGAAAGACTCCTAGATTTAAACTACCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCTTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGGTATGTTACTAACAAAGGAAGACAAAAGGTTGTCCCCCTAACTAACACAACAAATCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATCAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAATACTATTTTTAGATGGAATAGATAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATATTTTCTTTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MN691959,vif,4890,5469,5040,5619,forward,0.09157509157509158,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAGGGGATGGTTTTATAGACATCACTATGAAAGAACTCATCCAAGAATAAGTTCAGAAGTATACATCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTACTTTGACTGTTTTTCAGACTCTGCTATAAGAAAGGCCTTATTAGGACATATAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAG -MN691959,vpr,5408,5699,5558,5849,forward,0.09157509157509158,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCAACAGAAGAGAGCAAGAAATGGAGCCAGTAGATCCTAG -MN691959,tat_exon1,5679,5898,5829,6045,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ*,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA -MN691959,rev_exon1,5818,5899,5968,6046,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKFLYQSSK,MAGRSGDSDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG -MN691959,vpu,5910,6156,6060,6309,forward,0.7333193453629878,MQPIQIAIVALVVAIIIAIVV,MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL*,ATGCAACCTATACAAATAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGATCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG -MN691959,env,6070,8656,6223,8794,forward,0.1405525502318391,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*,ATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATGCAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGGGGAATGCTACTAATACCAATAGTAGTAATACCAATAGTAGTAGCGGGGAAATGATGATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAAATAAGGTGCAGAAAGAATATGCATTCTTTTATAAACTTGATATAGTACCAATAGATAATGATACTACCAGCTATACGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGATGTAGTAATTAGATCTGCCAATTTCACAGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGCCACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACACTCCCATGCAGAATAAAACAATTTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGCGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAACAACAATGGGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATAACATGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTATAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAA -MN691959,tat_exon2,8237,8333,8375,8471,forward,0.6672629695885509,RPTSQTRGDPTGPKE,RPTSQTRGDPTGPKE*KKKVERETETDPFD**,AGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGA -MN691959,rev_exon2,8238,8514,8376,8652,forward,0.210025203024363,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE*,GACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAG -MN691959,nef,8657,9278,8795,9416,forward,0.06582796957284964,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA -MN692074,nef,0,4059,8795,9416,forward,0.7628009106462086,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,WKG*FGPRKDKISLICGSTTHKATSLIGRTTHQGRGPDFH*PLDGASS*YQLIQRR*KRPMQERTTACYTL*ACMGWRTRRKKC*CGSLTAA*HFITWPESCIRSTTRIADFELSTRDFPLGTFQGGVAWAGLGSGEPSDAAYKQLLFACTGSLWLDQI*AWELSG*LGNPLLKPQ*SLP*VL*VVCARLLCDSGN*RSLRPF*SVWKISSSGARTGT*KRKRNQRSSLDAGLGLLKRARQEARGGDW*VRQKF*LAEARRREMGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*G*GGN*RKLY*IQEQMIQY*KK*ICQEDGNQK**GELEVLSK*DSMIRYS*KSVDIKL*VQY**DLHLST*LEEIC*LRLVAL*IFPLVLLKLYQ*N*SQEWMAQKLNNGH*QKKK*KH**KFVQKWKRKGKFQKLGLKIHTILQYLP*RKKTVLNGEN**ISENLIRELKTSGKFN*EYHIPQG*ERKNQ*QYWMWGMHIFQFP*IKNLGNILHLPYPVETMRHQGLDISTMCFHRDGKDHQQYSKVA*QKF*SLLENKIQK*LSINTWMIYM*DLI*K*GSIE*K*RN*DNIC*DGDLPHQTKNIRKNPHSFGWVMNSILINGQYSL*CCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QK*YH*QKKQSWNWQKTGKF*KNQYMEYIMTHQKT**QKYRSRGKVNGHIKFIKSHLKI*KQENMQK*GVPTLMM*NN*QRQCKK*PQKA**YGERLLNLNYPYKKKHGKHGGQSIGKPPGFLSGSLSIPLP**NYGTS*RKNP**EQKPSM*MGQLTGRLN*EKQDMLLTEEDKKLSP*LTQQIRRLNYKQFI*LCRIRD*K*T**QTHNMH*,TGGAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAG -MN692074,env,2,4115,6223,8794,forward,0.76033143808071,MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,gag,789,2292,789,2292,forward,0.19470123431286457,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA -MN692074,pol,2084,4115,2084,5096,forward,0.5617851221088768,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,vif,3617,4115,5040,5619,forward,0.7631664499349805,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,vpr,3617,4115,5558,5849,forward,0.7629151983204618,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,vpu,3617,4115,6060,6309,forward,0.7634058115037564,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA -MN692074,tat_exon1,3823,4084,5829,6045,forward,0.7659115426105717,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC -MN692074,rev_exon1,3823,4084,5968,6046,forward,0.7610789980732178,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC -MN692074,tat_exon2,4080,4164,8375,8471,forward,0.769292994661058,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA -MN692074,rev_exon2,4081,4153,8376,8652,forward,0.7667894365645325,YPVASPQMLHISSCFLPVLGLSG,YPVASPQMLHISSCFLPVLGLSG*,TACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAG -MN692145,gag,775,2281,789,2292,forward,0.20784453738651432,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGAACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGGACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGATAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACACAGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAATGGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAAAACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA -MN692145,pol,2070,5085,2084,5096,forward,0.14843087362171337,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGGACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATACCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATCAAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACTGGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MN692145,vif,5029,5608,5040,5619,forward,0.2608047690014903,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTATGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGACCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCATATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCCTAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAG -MN692145,vpr,5547,5838,5558,5849,forward,0.3566796368352788,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG -MN692145,tat_exon1,5818,6037,5829,6045,forward,0.28735632183908044,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA -MN692145,rev_exon1,5957,6038,5968,6046,forward,0.4274965800273598,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG -MN692145,vpu,6049,6298,6060,6309,forward,0.520618556701031,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*,ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG -MN692145,env,6212,8783,6223,8794,forward,0.4766895145301081,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA -MN692145,tat_exon2,8364,8460,8375,8471,forward,0.3921568627450981,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -MN692145,rev_exon2,8365,8641,8376,8652,forward,0.29843322556577967,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG -MN692145,nef,8784,9387,8795,9416,forward,0.3966849799795139,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA -MN090335,gag,315,1665,789,2292,forward,0.596665989022159,MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ,MYTIEGGYCII**SKFF*SCLKGWL*LFQYLFTAS*CF*QARINCESF*FPACPYYMF*SIFFLSPWP*PNFLPSI*FSPAQY*RSRTHLSPSSLR*SKMAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ*,ATGTACACAATAGAGGGTGGCTACTGTATTATATAATGATCTAAGTTCTTCTGATCCTGTCTGAAGGGATGGTTGTAGCTGTTCCAATATCTGTTTACAGCCTCCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGTTCCCTGCTTGCCCATACTATATGTTTTAATCTATATTTTTTCTTTCCCCCTGGCCTTAACCGAATTTTCTCCCATCTATCTAATTCTCCCCCGCTCAATACTGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGTCAAAAATGGCGTACTCACCAGTCGCCGCCCCTCGCCTCTTGCCGTGCGCGCTTCAGCAAGCCACCCCACAAGATTTGAACACTATGCTAAACACAGTGGGTGGACACCAAGCAGCTATGCAAATGTTAAAAGAGGTCATCAATGAGGAAGCTGCAGAATGGGATAGATTACATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATTCTGGGACTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAGCAAGGGCCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTTTAAGAGCCGAGCAAGCTACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAATCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGCAACAGGTACAGCCAACATACTGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGCCTGTTAAATGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAGGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAA -MN090335,pol,1427,4469,2084,5096,forward,0.27887169154684477,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAGGACATAGATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAATATGAACAGGTACCCATAGAAATTAGCGGACACAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGCACTCTAAATTTTCCCATCAGCCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGACGGCCCAAAGGTTAAACAATGGCCATTAACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTGTTTGCCATAAAGAAAAAAGATGGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGAATTCTGGGAAATTCAATTAGGTATACCACATCCTGCAGGGCTAAAAAAGAAAAAATCAGTCACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTATAATGTGCTTCCACAAGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAGATCCTGGAGCCTTTTAGAAAGACAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAACATAGAACAAAAGTAGAGGAACTGAGGCAACATCTGATGAGGTGGGGATTTACCACACCAGACAAAAAGCACCAGAAAGAACCCCCATTCCTTTGGATGGGGTATGAACTCCATCCTAATAAATGGACAGTACAGCCTATAGTACTGCCAGAAAAGGAAAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTGAAGCAATTATGTAAGCTCCTTAGGGGAACCAAAGCATTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGATCCGGTACATGGAGCATATTATGACCCAGCAAAGGACTTAATAGCAGAACTACAGAAGCAGGGAGAAGGTCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCATACTAATGATGTAAAGCAATTAACAGAGGCAGTGCAAAAAATATCCACAGAAAGTATAGTAATATGGGGAAGGACTCCTAAATTTAGATTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGATTATTGGCAAGCCACCTGGATCCCTGAGTGGGAGTTTGTCAACACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAATAGGGATAATAAATCAGGAAAAGCAGGATATGTTACTGATAGAGGAAGACAAAAGGTTGTCACCATAAATGACACAACAAATCAGAAAACTGAATTACAAGCCATTCATCTAGCCTTGCAGGATTCGGGGCTAGAAGTAAACATAGTAACAGACTCACAGTATGCATTAGGGATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTAATAAAAAAGGAAAAGGTCTACCTGGCATGGGTGCCAGCCCACAAAGGAATTGGAGGAAATGAACAGGTAGATAAACTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGAAAAAGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAACAATGGCTAGTGATTTTAACCTACCACCTATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGGCAAGTAGACTGTAGTCCAGGTATATGGCAGCTAGATTGTACACATTTAGAAGAAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTGATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTATTTTAAAACTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCCGCAATTTCACCAGTAATACAGTGAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGTATTCCCTACAATCCCCAGAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGATACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCCAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG -MN090335,vif,4413,4992,5040,5619,forward,0.3566796368352788,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAAAAATGGGCTTATAGACACCATTACGAAACCACTCATCCAAGAATAAGTTCAGAAGTACATATCCCACTAGGGGATGATAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAGAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAACAGCAGTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG -MN090335,vpr,4931,5222,5558,5849,forward,0.3808935556928146,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAGACCTAGGACAATATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATGGAGCCAGTAGATCATAG -MN090335,tat_exon1,5202,5421,5829,6045,forward,0.40192926045016075,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ*,ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAA -MN090335,rev_exon1,5341,5422,5968,6046,forward,0.524971623155505,MAGRSGDRDEDLLKTVRLIKFLYQSSK,MAGRSGDRDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAG -MN090335,vpu,5433,5682,6060,6309,forward,0.5244381020335356,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL*,ATGCAATCTTTAGAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTAGGCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAAAATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG -MN090335,env,5596,8158,6223,8794,forward,0.5152420275849952,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*,ATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTGGACCAGATGCATGAGGATATAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAGAAATGATACTGTAGGAAATCAAACAAATCTCACTGAAACTAATACAATACAGGGAAGAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAACATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAGGGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTGGTTTTGCAATTCTAAAGTGTAAGGATGAGATGTTCAATGGAACAGGACCATGTAAGAATGTCAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTGTCAACTCAACTACTGTTAAATGGTAGCCTAGCAGAAAAAGAGATAGTACTTAGATCTGAAAATTTCACAGACAATGGTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAGGGAGAGCAATTTATGCAACAGGGCAGATAATAGGAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGGAATGACACTTTAAGCAAAATAGTTGAAAAATTAAGGGAAAAATTTGGAAAAGATAAAACAATAATCTTTAATCAATCATCAGGAGGGGACATGGAAATTGAAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGGAGTGTTAATGGAACTAGCATAAACGGAACTAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATAAACAGGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCTATCAGTGGGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATGGTGGTACAAATAATAGTACAGAGGAGACGGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAAGGCACAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAGCGTTAGGAGCTATGTTCCTCGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCACTGACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGCAATAAATCTTACGATACCATCTGGGATAACATGACCTGGATGCAGTGGGACAGAGAAATTCAAAATTACACAGGGAAAATATACAACTTACTTGAGGAATCGCAAATCCAACAGGAAAAGAATGAAAAGGAATTATTAGAACTAGATCAATGGGCAAATTTGTGGAATTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAGGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAGGGAACAGATAGGGTTATAGAGGTAGGACAAAGAATTGGCAGAGCTTTTCTCCACATACCTAGAAGGATAAGACAGGGATTAGAAAGGGCTTTGCAATAA -MN090335,tat_exon2,7739,7835,8375,8471,forward,0.6842105263157894,RPSSQPRGDQTGPKE,RPSSQPRGDQTGPKE*KKKVERETEADPED**,AGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGA -MN090335,rev_exon2,7740,8016,8376,8652,forward,0.4267425320056898,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE*,GACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAG -MN090335,nef,8159,8813,8795,9416,forward,0.4891015417331206,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAGGTTGTATGGCTGGATGGCCTACTGTAAGGGAAAGAATGGAAAGAATTGATCCAAGGCCTGCTGCAAGGAGGGAACAAGCTGAGCCAGCAGCAGCTGGGGTAGGAGCAGCATCTCGAGACTTGGAAAAATATGGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAAGTAGGCTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTGGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA +KX505501.1,env,0,1823,6223,8793,forward,0.7623480451210163,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,vif,0,1823,5040,5618,forward,0.7647696476964769,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,nef,0,1823,8795,9415,forward,0.764345579086969,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,GLSG*TRSEPGSSLAN*GTHCLSLNKACLECFK*CVPVCCVTLVTRDPSDPFSQCGKSLAVAPEQGPESERETRGALSTQDSAC*ARAARGEGRRLVSTPKIF*LAEARRREMGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,tat_exon1,1,1749,5829,6044,forward,0.7680130480667754,MRKLQNGIDCIQCMQGLLHQAR,VSLVRPDLSLGALWLTREPTA*ASIKLALSASSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKGKPEELSRRRTRLAERAQQEARGGDW*VRRKFFD*RRLEGERWVRERQY*AGENWIDGKKFG*GQEEIKDIN*NI*YGQAES*NDSQLILAC*KHQKAVDKYWDSYNRLLRQDQKNLSLCIIQ*QSSIVYIKK*M*KTPRKP*TR*KKSKTKLGNKHSKPQLQEVAVRSATITL*CRIIRGKWYIRPCHQEL*MHG*K**RKRLSAQK*YPCFQHYQKEPPHKT*TPC*IQWGDIKQPCKC*KRPLMRKLQNGIDCIQCMQGLLHQAR*ENQGEVT*QELLVPFRNK*HG*QIIHLSQ*ERFIKDG*S*G*IK**ECIALSAFWT*DKDQRNLLETM*TGSIKP*EPNKPHRK*KIG*QKPCWSRMRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,GTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACCTGAAAGCGAAAGGGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAGCGCGCGCAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAATTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT +KX505501.1,gag,336,1823,789,2291,forward,0.3997973809613161,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTGGATAGATGGGAAAAAATTCGGCTAAGGCCAGGAGGAAATAAAAGATATAAACTAAAACATATAGTATGGGCAAGCAGAGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGCTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCGACTCTTAAGACAGGATCAGAAGAACTTAAGTCTTTGTATAATACAATAGCAGTCCTCTATTGTGTACATCAAAAAATAGATGTGAAAGACACCAAGGAAGCCTTAGACAAGATAGAAGAAGAGCAAAACAAAATTAGGAAACAAGCACAGCAAACCGCAGCTGCAGGAAGTAGCAGTCAGGTCAGCCACAATTACCCTGTAGTGCAGAATCATCAGGGGCAAATGGTATATCAGGCCCTGTCACCAAGAACTTTAAATGCATGGGTAAAAGTAATAGAGGAAAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGACTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATTAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATCCTAGGGTTAAATAAAATAGTAAGAATGTATAGCCCTGTCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCTTTTAGAGACTATGTAGACCGGTTCTATAAAACCCTAAGAGCCGAACAAGCCACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,rev_exon1,1306,1749,5968,6045,forward,0.758082497212932,MRTQIVKLF,MRTQIVKLF*KH*DQQPH*KK**QHAREWEDPAIKQEFWLKQ*AK*QIQLQ**CRKAILGTKEKLLSASIVAKKGT*PEIAGPLEKRAVGNVEGKDIK*KTVLRDRLIL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLD,ATGCGAACCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCCACACTAGAAGAAATGATGACAGCATGCCAGGGAGTGGGAGGACCCAGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAATGACAAATTCAGCTACAGTAATGATGCAGAAAGGCAATTTTAGGAACCAAAGAAAAACTGTTAAGTGCTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGAAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACATCAAATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGAT +KX505501.1,vpr,1599,1823,5558,5848,forward,0.763687959047407,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,vpu,1599,1823,6060,6308,forward,0.7672672672672673,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ,MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ*,ATGAAAGACTGTACTGAGAGACAGGCTAATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,pol,1627,1926,2084,5095,forward,0.7724330674761569,GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,IL*GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,ATTTTGTAGGGAAAATCTGGCCTTCCCACAAGGGAAGGCCGGGGAATTTCCTTCAGAACAGACCAGAGCCAACAGCCCCACCAGCAGAGAGCTTCAGGTTTGGGGAAGAGACACCAACTAGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA +KX505501.1,tat_exon2,1746,1823,8375,8470,forward,0.7616257781032589,RCIRSTTRTADTELFTRDFPLGTFQ,RCIRSTTRTADTELFTRDFPLGTFQ*,AGATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAG +KX505501.1,rev_exon2,1747,1926,8376,8651,forward,0.7620186257236345,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI,DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI*,GATGCATCCGGAGTACTACAAGGACTGCTGACACTGAGCTTTTCACAAGGGACTTTCCGCTGGGGACTTTCCAGTAGGGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACGAGGTCTCTCTGGTTAGACCAGATCTGA +MN691959,gag,639,2141,789,2291,forward,0.0801186943620179,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ,MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAGAATTAGATCGATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAAATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGAGATAAAAGACACCAAGGAAGCTTTAGAGAAGATAGAGGAAGAGCAAAACAAAAGTAAGAAAAAAGCACAGCAAGCAGCAGCTGACACAGGACACAGCAACCAGATCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAGTGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCYWYCTWTCCCAGTAGGAGAAATTTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTCTGGACATAAGACAAGGACCAAAAGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTAAAAGCATTGGGACCWGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAGGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGAGTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MN691959,pol,1934,4945,2084,5095,forward,0.054722889368558514,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAGATCTGGCCTTCCTACAAGGGAAGGCCAGGGAATTTTCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTCTGGGGTAGAGACAACAACTCCCTCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAACTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAAGACTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAGCTGAGACAACATCTGTTGAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAGAGCATTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGTATAGTAATATGGGGAAAGACTCCTAGATTTAAACTACCCATACAAAAGGAAACATGGGAAACATGGTGGACAGAATATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCTTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGGTATGTTACTAACAAAGGAAGACAAAAGGTTGTCCCCCTAACTAACACAACAAATCAGAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATCAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAGCAGTTAATAAAAAAGGAAAAGGTCTATCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTGCTGGAATCAGGAAAATACTATTTTTAGATGGAATAGATAAGGCCCAAGATGAACATGAGAAATATCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAACTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGGCAGGAAACAGCATATTTTCTTTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTGCTACGGTTAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGAATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTCCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN691959,vif,4890,5468,5040,5618,forward,0.09157509157509158,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAGGGGATGGTTTTATAGACATCACTATGAAAGAACTCATCCAAGAATAAGTTCAGAAGTATACATCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGACTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCTGAACTAGCAGACCAACTAATTCATCTGTATTACTTTGACTGTTTTTCAGACTCTGCTATAAGAAAGGCCTTATTAGGACATATAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAGCAGCATTAATAACACCAAAAAAGATAAAGCCACCTTTGCCTAGTGTTACAAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAG +MN691959,vpr,5408,5698,5558,5848,forward,0.09157509157509158,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS,MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGGGAGCCACACAATGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATTTGGCTCCATGGCTTAGGGCAACATATCTATGAAACTTATGGGGATACTTGGGCAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTTATCCATTTCAGAATTGGGTGTCGACATAGCAGAATAGGCGTTACTCAACAGAAGAGAGCAAGAAATGGAGCCAGTAGATCCTAG +MN691959,tat_exon1,5679,5894,5829,6044,forward,0.28735632183908044,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ,ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAG +MN691959,rev_exon1,5818,5898,5968,6045,forward,0.4807692307692307,MAGRSGDSDEDLLKTVRLIKFLYQSSK,MAGRSGDSDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN691959,vpu,5910,6155,6060,6308,forward,0.7333193453629878,MQPIQIAIVALVVAIIIAIVV,MQPIQIAIVALVVAIIIAIVV*SIVIIEYRKILRQRKIDRLIDRLIERAEDSGNESEGEVSALVEMGVEMGHHAPWDIDDL*,ATGCAACCTATACAAATAGCAATAGTAGCATTAGTAGTAGCAATAATAATAGCAATAGTTGTGTGATCCATAGTAATCATAGAATATAGGAAAATATTAAGACAAAGGAAAATAGACAGGTTAATTGATAGACTAATAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAG +MN691959,env,6070,8655,6223,8793,forward,0.1405525502318391,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL,MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL*,ATGAGAGTGAAGGAGAAGTGTCAGCACTTGTGGAGATGGGGGTGGAGATGGGGCACCATGCTCCTTGGGATATTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAGGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGATGCAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGTATTGGTAAATGTGACAGAAAATTTTAACATGTGGAAAAATGACATGGTAGAACAGATGCATGAGGATATAATCAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAGTTTAAAGTGCACTGATTTGGGGAATGCTACTAATACCAATAGTAGTAATACCAATAGTAGTAGCGGGGAAATGATGATGGAGAAAGGAGAGATAAAAAACTGCTCTTTCAATATCAGCACAAGCATAAGAAATAAGGTGCAGAAAGAATATGCATTCTTTTATAAACTTGATATAGTACCAATAGATAATGATACTACCAGCTATACGTTGACAAGTTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCCATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAATGTAATAATAAGACGTTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAATGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGCAGTCTAGCAGAAGAAGATGTAGTAATTAGATCTGCCAATTTCACAGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATCCGTATCCAGAGAGGACCAGGGAGAGCATTTGTTACAATAGGAAAAATAGGAAATATGAGACAAGCACATTGTAACATTAGTAGAGCAAAATGGAATGCCACTTTAAAACAGATAGCTAGCAAATTAAGAGAACAATTTGGAAATAATAAAACAATAATCTTTAAGCAATCCTCAGGAGGGGACCCAGAAATTGTAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATTCAACACAACTGTTTAATAGTACTTGGTTTAATAGTACTTGGAGTACTGAAGGGTCAAATAACACTGAAGGAAGTGACACAATCACACTCCCATGCAGAATAAAACAATTTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGCGGACAAATTAGATGTTCATCAAATATTACAGGGCTGCTATTAACAAGAGATGGTGGTAATAACAACAATGGGTCCGAGATCTTCAGACCTGGAGGAGGAGATATGAGGGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAAAATTGAACCATTAGGAGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTTTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAATGACGCTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAGCAGCAGAACAATTTGCTGAGGGCTATTGAGGCGCAACAGCATCTGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAATCCTGGCTGTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGATTTGGGGCTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGAACAGATTTGGAATAACATGACCTGGATGGAGTGGGACAGAGAAATTAACAATTACACAAGCTTAATACACTCCTTAATTGAAGAATCGCAAAACCAGCAAGAAAAGAATGAACAAGAATTATTGGAATTAGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAATTGGCTGTGGTATATAAAATTATTCATAATGATAGTAGGAGGCTTGGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCTATAGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAGGAGCTTATAGAGCTATTCGCCACATACCTAGAAGAATAAGACAGGGCTTGGAAAGGATTTTGCTATAA +MN691959,tat_exon2,8237,8332,8375,8470,forward,0.6672629695885509,RPTSQTRGDPTGPKE,RPTSQTRGDPTGPKE*KKKVERETETDPFD**,AGACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGA +MN691959,rev_exon2,8238,8513,8376,8651,forward,0.210025203024363,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE,DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE*,GACCCACCTCCCAAACCCGGGGGGACCCGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCATTCGATTAGTGAACGGATCCTTAGCACTTATCTGGGACGATCTGCGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATTGTAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGCCCTCAAATATTGGTGGAATCTCCTACAATATTGGAGTCAGGAGCTAAAGAATAG +MN691959,nef,8657,9277,8795,9415,forward,0.06582796957284964,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC,MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC*,ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGATCAGATATCCATTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGGTAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGAATGGATGACCCTGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA +MN692074,nef,0,4058,8795,9415,forward,0.7628009106462086,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,WKG*FGPRKDKISLICGSTTHKATSLIGRTTHQGRGPDFH*PLDGASS*YQLIQRR*KRPMQERTTACYTL*ACMGWRTRRKKC*CGSLTAA*HFITWPESCIRSTTRIADFELSTRDFPLGTFQGGVAWAGLGSGEPSDAAYKQLLFACTGSLWLDQI*AWELSG*LGNPLLKPQ*SLP*VL*VVCARLLCDSGN*RSLRPF*SVWKISSSGARTGT*KRKRNQRSSLDAGLGLLKRARQEARGGDW*VRQKF*LAEARRREMGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*G*GGN*RKLY*IQEQMIQY*KK*ICQEDGNQK**GELEVLSK*DSMIRYS*KSVDIKL*VQY**DLHLST*LEEIC*LRLVAL*IFPLVLLKLYQ*N*SQEWMAQKLNNGH*QKKK*KH**KFVQKWKRKGKFQKLGLKIHTILQYLP*RKKTVLNGEN**ISENLIRELKTSGKFN*EYHIPQG*ERKNQ*QYWMWGMHIFQFP*IKNLGNILHLPYPVETMRHQGLDISTMCFHRDGKDHQQYSKVA*QKF*SLLENKIQK*LSINTWMIYM*DLI*K*GSIE*K*RN*DNIC*DGDLPHQTKNIRKNPHSFGWVMNSILINGQYSL*CCQKKTAGLSMTYRS*WEN*IGQVRFTQGLK*GNYVNSLGEPKH*QK*YH*QKKQSWNWQKTGKF*KNQYMEYIMTHQKT**QKYRSRGKVNGHIKFIKSHLKI*KQENMQK*GVPTLMM*NN*QRQCKK*PQKA**YGERLLNLNYPYKKKHGKHGGQSIGKPPGFLSGSLSIPLP**NYGTS*RKNP**EQKPSM*MGQLTGRLN*EKQDMLLTEEDKKLSP*LTQQIRRLNYKQFI*LCRIRD*K*T**QTHNMH*,TGGAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAG +MN692074,env,2,4114,6223,8793,forward,0.76033143808071,MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,EGLIWSQKRQDILDLWIYHTQGYFPDWQNYTPGPGTRFPLTFGWCFKLVPVDPEKVEEANAGENNSLLHPISLHGMEDPEKEVLMWKFDSRLAFHHMARELHPEYYKNC*LRAIYKGLSAGDFPGRRGLGGTGEWRALRCCI*AAAFCLYWVSLVRPDLSLGALWLAREPTA*ASIKLALSALSSVCPSVV*LW*LEIPQTLLVSVENL*QWRPNRDLKAKEKPEELSRRRTRLAEARTARGEGRRLVSTPKILTSGG*KERDGCESVSIKCGRIRQMGKNSVKARGKEKI*IKTYSMGKQGARTIRS*SWPVRNIRRL*TNTGTATTIPSDRIRRT*III*YNSNPLLCASKDRGKRHQGSFREGRGRAKQK*EKGTASSS*HRKQQPGQPKLPYSAEHPGANGTSGHIT*NFKCMGKSSRREGFQPRSNTHVFSIIRRSHPTRFKHHAKHSGGTSSSHANVKRDHQ*GSCRMG*IAPSACRAYCTRPDERAKGK*HSRNY*YPSGTNRMDDK*STYPSRRNL*KMDNHGIK*NSKDV*SYQHSGHKTRTKGTL*RLCRSVL*NSKSRASFTGGKKLDDRNLVGPKCEPRL*DYFESIGTSRYIRRNDDSMSGSGRTRP*SKSFGGSNEPSNKFSYHNDAERQF*EPKKEC*VFQLWQRRAHSQKLQGP*EKGLLEMWKGRTPNERLY*ETG*FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,GAAGGGCTAATTTGGTCCCAGAAAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCGGGGACCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGAGAAGGTAGAAGAGGCCAATGCAGGAGAGAACAACAGCTTGTTACACCCTATAAGCCTGCATGGGATGGAGGACCCGGAGAAAGAAGTGTTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAATTGCTGACTTCGAGCTATCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGAGGCGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACGGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCAAAAATTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,gag,789,2291,789,2291,forward,0.19470123431286457,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ,MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGTGCGGGAGAATTAGACAAATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATATAGTATGGGCAAGCAGGGAGCTAGAACGATTCGCAGTTAATCCTGGCCTGTTAGAAACATCAGAAGGCTGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAGATCATTATATAATACAATAGCAACCCTCTATTGTGTGCATCAAAAGATAGAGGTAAAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGCAGCAGCTGACACAGGAAACAACAGCCAGGTCAGCCAAAATTACCCTATAGTGCAGAACATCCAGGGGCAAATGGTACATCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAGACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCACCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAGCCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCATGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGACATAAGACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGATCGGTTCTATAAAACTCTAAGAGCCGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATGCGAACCCAGATTGTAAGACTATTTTGAAAGCATTGGGACCAGCCGCTACATTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTTTTGGCGGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAAAGGCAATTTTAGGAACCAAAAAAGGAATGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAGAAATTGCAGGGCCCCTAGGAAAAGGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAGAGACAGGCTAATTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MN692074,pol,2084,4114,2084,5095,forward,0.5617851221088768,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,TTTTTTAGGGAAGATCTGGCCTTCCCACAAGGGAAGGCCAGGGAATTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCGCTCAGAAGCAGGAGCCGATAGACAAGGAACTGTATCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAGGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAATTTGCCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACTCATAGAAATCTGTGGACATAAAGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGATTGGTTGCACTTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCCATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGACTTCTGGGAAGTTCAATTAGGAATACCACATCCCGCAGGGTTAAGAAAGAAAAAATCAGTAACAGTACTGGATGTGGGGGATGCATATTTTTCAGTTCCCTTAGATAAAGAATTTAGGAAATATACTGCATTTACCATACCCAGTAGAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATTTTAGAGCCTTTTAGAAAACAAAATCCAGAAATAGTTATCTATCAATACATGGATGATTTATATGTAGGATCTGATTTAGAAATAGGGCAGCATAGAATAAAAATAGAGGAACTGAGACAACATCTGTTGAGATGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCCCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTGAATTGGGCAAGTCAGATTTACCCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAAATAGTACCACTAACAAAAGAAGCAGAGCTGGAACTGGCAGAAAACAGGGAAATTCTAAAAGAACCAGTACATGGAGTATATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGTCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAAAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,vif,3617,4114,5040,5618,forward,0.7631664499349805,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,vpr,3617,4114,5558,5848,forward,0.7629151983204618,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,vpu,3617,4114,6060,6308,forward,0.7634058115037564,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI,MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI*,ATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAACCACAGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAAACTACCCATACAAAAAGAAACATGGGAAGCATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATACCCAGTGGCGAGCCCTCAGATGCTGCATATAA +MN692074,tat_exon1,3823,4083,5829,6044,forward,0.7659115426105717,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC +MN692074,rev_exon1,3823,4083,5968,6045,forward,0.7610789980732178,MVPVRERTHSRSRNLLCRWGS,MVPVRERTHSRSRNLLCRWGS*QGD*IRKSRICY*QRKTKSCLPN*HNKSED*ITSNSSSFAGFGIRSKHSNRLTICIRNHSSTTRY,ATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAACAGGGAGACTAAATTAGGAAAAGCAGGATATGTTACTAACAGAGGAAGACAAAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAC +MN692074,tat_exon2,4080,4163,8375,8470,forward,0.769292994661058,IPSGEPSDAAYKQLLFACTGSLWLDQI,IPSGEPSDAAYKQLLFACTGSLWLDQI*,ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGA +MN692074,rev_exon2,4081,4152,8376,8651,forward,0.7667894365645325,YPVASPQMLHISSCFLPVLGLSG,YPVASPQMLHISSCFLPVLGLSG*,TACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAG +MN692145,gag,775,2280,789,2291,forward,0.20784453738651432,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ,MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ*,ATGGGTGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGAACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGGACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGTAGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGATAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACACAGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAATGGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAAGGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTACCCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCATTCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAAAACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGTCTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAATTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGCCAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCAAATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAA +MN692145,pol,2070,5084,2084,5095,forward,0.14843087362171337,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED,FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCCCACAAGGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGAACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGGACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATTGGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATACCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAAGGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTCAATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATCAAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAAGGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAAATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAAGCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAATCAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACTGGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAATACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTAGACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGACAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGGATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAATAGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN692145,vif,5029,5607,5040,5618,forward,0.2608047690014903,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH,MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTATGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGACCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCATATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCCTAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAG +MN692145,vpr,5547,5837,5558,5848,forward,0.3566796368352788,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS,MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACCGAGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTTAGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCATTTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAATGGAGCCAATAGATCCTAG +MN692145,tat_exon1,5818,6036,5829,6044,forward,0.28735632183908044,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ,MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ*,ATGGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGCTTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA +MN692145,rev_exon1,5957,6037,5968,6045,forward,0.4274965800273598,MAGRSGDSDEELLKTVRLIKFLYQSSK,MAGRSGDSDEELLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAG +MN692145,vpu,6049,6297,6060,6308,forward,0.520618556701031,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL,MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL*,ATGAACTCTTTACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTCTATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAG +MN692145,env,6212,8782,6223,8793,forward,0.4766895145301081,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL,MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL*,ATGAGAGTGAAGGGGATCAGGAAGAACTATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCACCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTAGTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAAATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAGGAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAGAATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTAATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAAAAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAAAGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGTGTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAGAAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTACAGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGGTTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAGCACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAATTAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAGAAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAACTGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGGGAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGTTGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGACCTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAAGAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAGTCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATCAACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTTGGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGGAGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGCAGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGTGGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAGGAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTATAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGGGCTTTGAAAGGGCTTTGCTATAA +MN692145,tat_exon2,8364,8459,8375,8470,forward,0.3921568627450981,RPASQPRGDPTGPKESKKKVERETETDPLH,RPASQPRGDPTGPKESKKKVERETETDPLH**,AGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +MN692145,rev_exon2,8365,8640,8376,8651,forward,0.29843322556577967,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE,DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE*,GACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGAAAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACCGCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATAG +MN692145,nef,8784,9386,8795,9415,forward,0.3966849799795139,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC,MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC*,ATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGATGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCAGTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAATGCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACTACAAGAACTGCTGA +MN090335,gag,315,1664,789,2291,forward,0.596665989022159,MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ,MYTIEGGYCII**SKFF*SCLKGWL*LFQYLFTAS*CF*QARINCESF*FPACPYYMF*SIFFLSPWP*PNFLPSI*FSPAQY*RSRTHLSPSSLR*SKMAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ*,ATGTACACAATAGAGGGTGGCTACTGTATTATATAATGATCTAAGTTCTTCTGATCCTGTCTGAAGGGATGGTTGTAGCTGTTCCAATATCTGTTTACAGCCTCCTGATGTTTCTAACAGGCCAGGATTAACTGCGAATCGTTCTAGTTCCCTGCTTGCCCATACTATATGTTTTAATCTATATTTTTTCTTTCCCCCTGGCCTTAACCGAATTTTCTCCCATCTATCTAATTCTCCCCCGCTCAATACTGACGCTCTCGCACCCATCTCTCTCCTTCTAGCCTCCGCTAGTCAAAAATGGCGTACTCACCAGTCGCCGCCCCTCGCCTCTTGCCGTGCGCGCTTCAGCAAGCCACCCCACAAGATTTGAACACTATGCTAAACACAGTGGGTGGACACCAAGCAGCTATGCAAATGTTAAAAGAGGTCATCAATGAGGAAGCTGCAGAATGGGATAGATTACATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGGATGGATGACACATAATCCACCTATCCCAGTAGGAGAGATTTATAAAAGATGGATAATTCTGGGACTAAATAAAATAGTAAGAATGTATAGCCCTACCAGCATTTTGGACATAAAGCAAGGGCCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAAAACTTTAAGAGCCGAGCAAGCTACACAGGAAGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAGAATGCAAATCCAGATTGTAAAACTATTTTAAAAGCATTAGGACCAGCAGCTACACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGGGGACCCGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGCAACAGGTACAGCCAACATACTGATGCAGAGAGGCAATTTTAGGAACCAAAGAAAGCCTGTTAAATGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAGGGAAGGACACCAAATGAAGGATTGCACTGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAA +MN090335,pol,1427,4468,2084,5095,forward,0.27887169154684477,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED,FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED*,TTTTTTAGGGAAAATCTGGCCTTCTCACAAGGGAAGGCCAGGGAACTTTCCTCAGAGCCGACCAGAAATTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCCCCTCCAGAAGAGAGCTTCAGGTTTGGGGAAGCAACAACTCCCTCTCAGAAGCAGGAGACAATGGACAAGGAGCTGTATCCTCCTCTAACTTCCCTCAGATCACTCTTTGGCAACGACCCATCGTCACAATAAAGATAGGGGGGCAACTAAAGGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAGGACATAGATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAATATGAACAGGTACCCATAGAAATTAGCGGACACAAAGCTATAGGTACAGTGTTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGCACTCTAAATTTTCCCATCAGCCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGACGGCCCAAAGGTTAAACAATGGCCATTAACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTGTTTGCCATAAAGAAAAAAGATGGCACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTTAATAAGAGAACTCAAGAATTCTGGGAAATTCAATTAGGTATACCACATCCTGCAGGGCTAAAAAAGAAAAAATCAGTCACAGTACTGGATGTGGGTGATGCATATTTTTCAGTTCCCTTAGATAAAGACTTCAGGAAATATACTGCATTTACCATACCTAGTATAAACAATGAGACACCAGGGATTAGATATCAGTATAATGTGCTTCCACAAGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAGATCCTGGAGCCTTTTAGAAAGACAAATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAACATAGAACAAAAGTAGAGGAACTGAGGCAACATCTGATGAGGTGGGGATTTACCACACCAGACAAAAAGCACCAGAAAGAACCCCCATTCCTTTGGATGGGGTATGAACTCCATCCTAATAAATGGACAGTACAGCCTATAGTACTGCCAGAAAAGGAAAGTTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTATGCAGGGATTAAAGTGAAGCAATTATGTAAGCTCCTTAGGGGAACCAAAGCATTAACAGAAGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTCTAAAAGATCCGGTACATGGAGCATATTATGACCCAGCAAAGGACTTAATAGCAGAACTACAGAAGCAGGGAGAAGGTCAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGGAAATATGCAAGAACGAGGGGTGCCCATACTAATGATGTAAAGCAATTAACAGAGGCAGTGCAAAAAATATCCACAGAAAGTATAGTAATATGGGGAAGGACTCCTAAATTTAGATTACCCATACAAAAAGAAACATGGGAAACATGGTGGACAGATTATTGGCAAGCCACCTGGATCCCTGAGTGGGAGTTTGTCAACACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAAAAAGAACCCATAATAGGAGCAGAAACCTTCTATGTAGATGGGGCAGCTAATAGGGATAATAAATCAGGAAAAGCAGGATATGTTACTGATAGAGGAAGACAAAAGGTTGTCACCATAAATGACACAACAAATCAGAAAACTGAATTACAAGCCATTCATCTAGCCTTGCAGGATTCGGGGCTAGAAGTAAACATAGTAACAGACTCACAGTATGCATTAGGGATCATTCAAGCACAACCAGATAAAAGTGAATCAGAGTTAGTCAGTCAAATAATAGAACAGTTAATAAAAAAGGAAAAGGTCTACCTGGCATGGGTGCCAGCCCACAAAGGAATTGGAGGAAATGAACAGGTAGATAAACTAGTCAGTGCTGGAATCAGGAAAGTACTATTTTTAGATGGAATAGAAAAAGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAACAATGGCTAGTGATTTTAACCTACCACCTATAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCTATGCATGGGCAAGTAGACTGTAGTCCAGGTATATGGCAGCTAGATTGTACACATTTAGAAGAAAAAATTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTGATTCCAGCAGAGACAGGGCAAGAAACAGCATACTTTATTTTAAAACTAGCAGGAAGATGGCCAGTAAAAACAATACATACAGACAATGGCCGCAATTTCACCAGTAATACAGTGAAGGCCGCCTGTTGGTGGGCGGGAATCAAGCAGGAATTTGGTATTCCCTACAATCCCCAGAGTCAAGGAGTAGTAGAATCTATGAATAATGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGATACAGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGAAATACAGACTAAAGAATTACAAAAACAAATTACAAAAATTCCAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAACAGTGACATAAAAGTAGTGCCAAGAAGAAAAGCAAAAATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAG +MN090335,vif,4413,4991,5040,5618,forward,0.3566796368352788,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH,MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH*,ATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTTAGTAAAATACCATATGTATATTTCAAAGAAAGCCAAAAAATGGGCTTATAGACACCATTACGAAACCACTCATCCAAGAATAAGTTCAGAAGTACATATCCCACTAGGGGATGATAGATTGGTAATAACAACATATTGGGGTCTGCATACAGGAGAGAGAGACTGGCATTTGGGCCAGGGAGTCTCCATAGAATGGAGAAAAAGGAGATATAGCACACAAGTAGACCCTGACTTAGCAGACCATCTAATTCATGTGCATTATTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATAGAGTTAGCCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGATCTCTACAATACTTGGCACTAACAGCAGTAATAACACCAAAGAAGATAAAGCCACCTTTGCCTAGTGTAAAGAAACTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAG +MN090335,vpr,4931,5221,5558,5848,forward,0.3808935556928146,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS,MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS*,ATGGAACAAGCCCCAGAAGACCAAGGGCCACAGAGAGAGCCATACAATGAATGGACACTAGAGCTTTTAGAAGAGCTTAAGAGAGAAGCTGTTAGACATTTCCCTAGACCATGGCTACAAGACCTAGGACAATATATCTATGAAACTTATGGGGATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAAATGCTGTTTATTCATTTCAGAATTGGGTGTCACCATAGCAGAATAGGCATTGTTCTGCAAAGAAGAGCAAGAAATGGAGCCAGTAGATCATAG +MN090335,tat_exon1,5202,5417,5829,6044,forward,0.40192926045016075,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ,ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAG +MN090335,rev_exon1,5341,5421,5968,6045,forward,0.524971623155505,MAGRSGDRDEDLLKTVRLIKFLYQSSK,MAGRSGDRDEDLLKTVRLIKFLYQSSK,ATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAAG +MN090335,vpu,5433,5681,6060,6308,forward,0.5244381020335356,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL,MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL*,ATGCAATCTTTAGAGATATTAGCAATAGTAGCATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTAGGCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAAAATAATTAATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAG +MN090335,env,5596,8157,6223,8793,forward,0.5152420275849952,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ,MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ*,ATGAGAGCGAAGGGGATCAGGAAGAATTGTCAGCACTTGTGGTGGAAATGGGGCACGATGCTCCTTGGGATGTTGATGATCTGTAGTGCTGCGGAAAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAGAGATGCAAATACCACTCTATTCTGTGCATCAGATGCTAAAGCATATGATACAGAAGTACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCTAACCCACATGAAGTAGAATTGAAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTGGACCAGATGCATGAGGATATAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGCAAAATTGACCCCACTCTGTGTTACTTTAAATTGCACTGATTTAAGAAATGATACTGTAGGAAATCAAACAAATCTCACTGAAACTAATACAATACAGGGAAGAGAAATGACAAACTGCTCTTTCAATATCACCACAGAGATAAGAGATAAAGTGCGAAAAGAACATGCACTTTTTTATAAACTTGATGTCATGCCAATAGATAGGGATAATACAAGTTATACATTGATAAATTGCAATACCTCAGTCATTACACAGGCCTGTCCAAAGGTAACCTTTGAACCAATTCCCATACATTATTGTACTCCAGCTGGTTTTGCAATTCTAAAGTGTAAGGATGAGATGTTCAATGGAACAGGACCATGTAAGAATGTCAGCACAGTACAATGTACACATGGAATTAGACCAGTAGTGTCAACTCAACTACTGTTAAATGGTAGCCTAGCAGAAAAAGAGATAGTACTTAGATCTGAAAATTTCACAGACAATGGTAAAAATATAATAGTACAGCTAAATAGATCTATAGTAATTAATTGTACAAGACCCAACAACAATACAAGAAAAAGTATAAGTGTAGCAGGGAGAGCAATTTATGCAACAGGGCAGATAATAGGAGATATAAGACAAGCACATTGTAACATCAGTGAGACAGATTGGAATGACACTTTAAGCAAAATAGTTGAAAAATTAAGGGAAAAATTTGGAAAAGATAAAACAATAATCTTTAATCAATCATCAGGAGGGGACATGGAAATTGAAACGCACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAACACAACACGACTGTTTAATAGTACTTGGAGTGTTAATGGAACTAGCATAAACGGAACTAAAAATATCACACTCCCGTGCAGAATAAAACAAATTATAAACAGGTGGCAGGAAGTAGGAAAAGCAATGTATGCCCCTCCTATCAGTGGGATAATTAGGTGCTCATCAAATATTACAGGACTAATATTAACAAGAGATGGTGGTACAAATAATAGTACAGAGGAGACGGAGACCTTCAGACCTGGAGGGGGAAATATGAAGGACAATTGGAGAAGTGAATTATATAAATACAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAAGGCACAGAGAAGAGTGGTGCAGAGAGAAAAAAGAGCAATAGGAGCGTTAGGAGCTATGTTCCTCGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCACTGACGCTGACGGTACAAGCCAGACAATTATTGTCTGGTATAGTGCAACAGCAGAACAATCTGCTGAGGGCTATTGAGGCGCAACAGCATATGTTGCAACTCACAGTCTGGGGCATCAAACAGCTCCAGGCAAGAGTCCTGTCTGTGGAAAGATACCTACAGGATCAACAGCTCCTGGGGATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTACTGTGCCTTGGAATACTAGTTGGAGCAATAAATCTTACGATACCATCTGGGATAACATGACCTGGATGCAGTGGGACAGAGAAATTCAAAATTACACAGGGAAAATATACAACTTACTTGAGGAATCGCAAATCCAACAGGAAAAGAATGAAAAGGAATTATTAGAACTAGATCAATGGGCAAATTTGTGGAATTGGTTTAGTATAACAAAATGGCTGTGGTATATAAAAATATTCATAATGATAGTAGGAGGCTTAGTAGGTTTAAAAATAATTTTTGCTGTATTTTCTATAGTGAATAGAGTTAGGCAGGGATACTCACCATTATCATTGCAGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAGTGCTGTTAGCTTGCTCAATACCATAGCTATCGCAGTAGCTGAGGGAACAGATAGGGTTATAGAGGTAGGACAAAGAATTGGCAGAGCTTTTCTCCACATACCTAGAAGGATAAGACAGGGATTAGAAAGGGCTTTGCAATAA +MN090335,tat_exon2,7739,7834,8375,8470,forward,0.6842105263157894,RPSSQPRGDQTGPKE,RPSSQPRGDQTGPKE*KKKVERETEADPED**,AGACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGA +MN090335,rev_exon2,7740,8015,8376,8651,forward,0.4267425320056898,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE,DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE*,GACCCTCCTCCCAACCCCGAGGGGACCAGACAGGCCCGAAGGAATAGAAGAAGAAGGTGGAGAGAGAGACAGAGGCAGATCCGGAAGATTAGTGACTGGATTCTTACCACTCATCTGGGACGACCTGCGGAGCCTGTGCCTCTTCAGCTACCACCACTTGAGAGACTTACTCTTGATTGTGCTGAGGACTGTGCAAGTTCTGGGACACAGGGGGTGGGAGATCCTCAAGTACTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAACTAAAGAATAG +MN090335,nef,8159,8812,8795,9415,forward,0.4891015417331206,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC,MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC*,ATGGGTGGCAAGTGGTCAAAAGGTTGTATGGCTGGATGGCCTACTGTAAGGGAAAGAATGGAAAGAATTGATCCAAGGCCTGCTGCAAGGAGGGAACAAGCTGAGCCAGCAGCAGCTGGGGTAGGAGCAGCATCTCGAGACTTGGAAAAATATGGAGCAATCACAAGTAGCAATACATCAACTACTAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAAGTAGGCTTTCCAGTCAGACCTCAGGTACCTTTAAGACCAATGACTTACAAAGCAGCTTTGGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTGGTCCCAGAGAAGACAAGAAATCCTTGATTTGTGGGTTTACCACACACAAGGATACTTCCCTGATTGGCAAAACTACACACCAGGACCAGGGGTCAGATTTCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGATCCAGACCAAGTAGAGAAGGCCAATGAAGGAGAGAACAACTGCTTGCTACACCCTATGAGCCTGCATGGGATGGAAGACTCAGAGGGAGAAGTGTTAATGTGGAAGTTTGACAGCAGCCTGGCGTTTCATCATAGAGCCCGAGAACAACATCCGGAGTACTACAAAGACTGCTGA diff --git a/tests/expected-results-small/errors.json b/tests/expected-results-small/errors.json index e0159fe..0f52eb6 100644 --- a/tests/expected-results-small/errors.json +++ b/tests/expected-results-small/errors.json @@ -3,52 +3,52 @@ { "sequence_name": "KX505501.1", "error": "DeletionInOrf", - "message": "ORF pol at 2084-5096 can have maximum deletions 30, got 2721" + "message": "ORF pol at 2084-5095 can have maximum deletions 30, got 2721" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6322" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6322" }, { "sequence_name": "KX505501.1", "error": "InsertionInOrf", - "message": "Smaller ORF vif at 5040-5619 can have maximum insertions 90, got 909" + "message": "Smaller ORF vif at 5040-5618 can have maximum insertions 90, got 909" }, { "sequence_name": "KX505501.1", "error": "DeletionInOrf", - "message": "Smaller ORF vpr at 5558-5849 can have maximum deletions 30, got 66" + "message": "Smaller ORF vpr at 5558-5848 can have maximum deletions 30, got 66" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892" + "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5892" }, { "sequence_name": "KX505501.1", "error": "InternalStopInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6046 contains an internal stop codon at 6004" + "message": "Smaller ORF rev_exon1 at 5968-6045 contains an internal stop codon at 6004" }, { "sequence_name": "KX505501.1", "error": "FrameshiftInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains out of frame indels that impact 189 positions." + "message": "Smaller ORF vpu at 6060-6308 contains out of frame indels that impact 190 positions." }, { "sequence_name": "KX505501.1", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 51 positions." + "message": "Smaller ORF tat_exon2 at 8375-8470 contains out of frame indels that impact 51 positions." }, { "sequence_name": "KX505501.1", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 96" + "message": "Smaller ORF rev_exon2 at 8376-8651 can have maximum deletions 30, got 96" }, { "sequence_name": "KX505501.1", "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 867" + "message": "Smaller ORF nef at 8795-9415 can have maximum insertions 90, got 867" }, { "sequence_name": "KX505501.1", @@ -70,59 +70,59 @@ { "sequence_name": "MN691959", "error": "InternalStopInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon at 6123" + "message": "Smaller ORF vpu at 6060-6308 contains an internal stop codon at 6123" }, { "sequence_name": "MN691959", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" + "message": "Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420" } ], "MN692074": [ { "sequence_name": "MN692074", "error": "DeletionInOrf", - "message": "ORF pol at 2084-5096 can have maximum deletions 30, got 981" + "message": "ORF pol at 2084-5095 can have maximum deletions 30, got 981" }, { "sequence_name": "MN692074", "error": "InternalStopInOrf", - "message": "ORF env at 6223-8794 contains an internal stop codon at 6550" + "message": "ORF env at 6223-8793 contains an internal stop codon at 6550" }, { "sequence_name": "MN692074", "error": "DeletionInOrf", - "message": "Smaller ORF vif at 5040-5619 can have maximum deletions 30, got 81" + "message": "Smaller ORF vif at 5040-5618 can have maximum deletions 30, got 81" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF vpr at 5558-5849 can have maximum insertions 90, got 207" + "message": "Smaller ORF vpr at 5558-5848 can have maximum insertions 90, got 207" }, { "sequence_name": "MN692074", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6045 contains an internal stop codon at 5892" + "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon at 5892" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF vpu at 6060-6309 can have maximum insertions 90, got 249" + "message": "Smaller ORF vpu at 6060-6308 can have maximum insertions 90, got 249" }, { "sequence_name": "MN692074", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains out of frame indels that impact 40 positions." + "message": "Smaller ORF tat_exon2 at 8375-8470 contains out of frame indels that impact 40 positions." }, { "sequence_name": "MN692074", "error": "DeletionInOrf", - "message": "Smaller ORF rev_exon2 at 8376-8652 can have maximum deletions 30, got 204" + "message": "Smaller ORF rev_exon2 at 8376-8651 can have maximum deletions 30, got 204" }, { "sequence_name": "MN692074", "error": "InsertionInOrf", - "message": "Smaller ORF nef at 8795-9416 can have maximum insertions 90, got 882" + "message": "Smaller ORF nef at 8795-9415 can have maximum insertions 90, got 882" }, { "sequence_name": "MN692074", @@ -140,12 +140,12 @@ { "sequence_name": "MN090335", "error": "InternalStopInOrf", - "message": "ORF gag at 789-2292 contains an internal stop codon at 822" + "message": "ORF gag at 789-2291 contains an internal stop codon at 822" }, { "sequence_name": "MN090335", "error": "InternalStopInOrf", - "message": "Smaller ORF tat_exon2 at 8375-8471 contains an internal stop codon at 8420" + "message": "Smaller ORF tat_exon2 at 8375-8470 contains an internal stop codon at 8420" }, { "sequence_name": "MN090335", diff --git a/tests/expected-results-small/holistic.json b/tests/expected-results-small/holistic.json index b652f68..b806eda 100644 --- a/tests/expected-results-small/holistic.json +++ b/tests/expected-results-small/holistic.json @@ -6,9 +6,9 @@ "blast_matched_qlen": 1997, "blast_sseq_coverage": 0.2498456472525211, "blast_qseq_coverage": 1.2158237356034052, - "blast_sseq_orfs_coverage": 0.17663960024984385, + "blast_sseq_orfs_coverage": 0.17666166916541728, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 4 }, "MN691959": { @@ -20,7 +20,7 @@ "blast_qseq_coverage": 1.1086063415148004, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MN692074": { @@ -30,9 +30,9 @@ "blast_matched_qlen": 4178, "blast_sseq_coverage": 0.5042189750977567, "blast_qseq_coverage": 1.1728099569171853, - "blast_sseq_orfs_coverage": 0.4114928169893816, + "blast_sseq_orfs_coverage": 0.411544227886057, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 4 }, "MN692145": { @@ -44,7 +44,7 @@ "blast_qseq_coverage": 1.1271545051088863, "blast_sseq_orfs_coverage": 1.0, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 }, "MN090335": { @@ -54,9 +54,9 @@ "blast_matched_qlen": 9069, "blast_sseq_coverage": 0.9842560197571517, "blast_qseq_coverage": 1.0603153600176425, - "blast_sseq_orfs_coverage": 1.0003747657713928, + "blast_sseq_orfs_coverage": 1.000374812593703, "orfs_start": 789, - "orfs_end": 8794, + "orfs_end": 8793, "blast_n_conseqs": 3 } } \ No newline at end of file diff --git a/tests/expected-results-small/orfs.json b/tests/expected-results-small/orfs.json index 0e30b50..5b0bf90 100644 --- a/tests/expected-results-small/orfs.json +++ b/tests/expected-results-small/orfs.json @@ -3,9 +3,9 @@ { "name": "env", "start": 0, - "end": 1824, + "end": 1823, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.7623480451210163, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -15,9 +15,9 @@ { "name": "vif", "start": 0, - "end": 1824, + "end": 1823, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7647696476964769, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -27,9 +27,9 @@ { "name": "nef", "start": 0, - "end": 1824, + "end": 1823, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.764345579086969, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -39,9 +39,9 @@ { "name": "tat_exon1", "start": 1, - "end": 1750, + "end": 1749, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.7680130480667754, "protein": "MRKLQNGIDCIQCMQGLLHQAR", @@ -51,9 +51,9 @@ { "name": "gag", "start": 336, - "end": 1824, + "end": 1823, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.3997973809613161, "protein": "MGARASVLSGGELDRWEKIRLRPGGNKRYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPTLKTGSEELKSLYNTIAVLYCVHQKIDVKDTKEALDKIEEEQNKIRKQAQQTAAAGSSSQVSHNYPVVQNHQGQMVYQALSPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIAWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPVSILDIRQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPSHKARVLAEAMSQMTNSATVMMQKGNFRNQRKTVKCFNCGKEGHIARNCRAPRKKGCWKCGREGHQMKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -63,9 +63,9 @@ { "name": "rev_exon1", "start": 1306, - "end": 1750, + "end": 1749, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.758082497212932, "protein": "MRTQIVKLF", @@ -75,9 +75,9 @@ { "name": "vpr", "start": 1599, - "end": 1824, + "end": 1823, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.763687959047407, "protein": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -87,9 +87,9 @@ { "name": "vpu", "start": 1599, - "end": 1824, + "end": 1823, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7672672672672673, "protein": "MKDCTERQANFVGKIWPSHKGRPGNFLQNRPEPTAPPAESFRFGEETPTRCIRSTTRTADTELFTRDFPLGTFQ", @@ -99,9 +99,9 @@ { "name": "pol", "start": 1627, - "end": 1927, + "end": 1926, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.7724330674761569, "protein": "GKSGLPTREGRGISFRTDQSQQPHQQRASGLGKRHQLDASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI", @@ -111,9 +111,9 @@ { "name": "tat_exon2", "start": 1746, - "end": 1824, + "end": 1823, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.7616257781032589, "protein": "RCIRSTTRTADTELFTRDFPLGTFQ", @@ -123,9 +123,9 @@ { "name": "rev_exon2", "start": 1747, - "end": 1927, + "end": 1926, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.7620186257236345, "protein": "DASGVLQGLLTLSFSQGTFRWGLSSRGVAWAGLGSGEPSDAAYKQLLSACTRSLWLDQI", @@ -137,9 +137,9 @@ { "name": "gag", "start": 639, - "end": 2142, + "end": 2141, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.0801186943620179, "protein": "MGARASVLSGGELDRWEKIRLRPGGKKKYKLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTVATLYCVHQRIEIKDTKEALEKIEEEQNKSKKKAQQAAADTGHSNQISQNYPIVQNIQGQVVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNXXXPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRNQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKECTERQANFLGKIWPSYKGRPGNFLQSRPEPTAPPEESFRSGVETTTPSQKQEPIDKELYPLTSLRSLFGNDPSSQ", @@ -149,9 +149,9 @@ { "name": "pol", "start": 1934, - "end": 4946, + "end": 4945, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.054722889368558514, "protein": "FFREDLAFLQGKAREFSSEQTRANSPTRRELQVWGRDNNSLSEAGADRQGTVSFNFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGLTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTRALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKITTESIVIWGKTPRFKLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNKGRQKVVPLTNTTNQKTELQAIYLALQDSGLEVNIVTDSQYALGIIQAQPDQSESELVNQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKILFLDGIDKAQDEHEKYHSNWRAMASDFNLPPVVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSATVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -161,9 +161,9 @@ { "name": "vif", "start": 4890, - "end": 5469, + "end": 5468, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.09157509157509158, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKARGWFYRHHYERTHPRISSEVYIPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPELADQLIHLYYFDCFSDSAIRKALLGHIVSPRCEYQAGHNKVGSLQYLALAALITPKKIKPPLPSVTKLTEDRWNKPQKTKGHRGSHTMNGH", @@ -173,9 +173,9 @@ { "name": "vpr", "start": 5408, - "end": 5699, + "end": 5698, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.09157509157509158, "protein": "MEQAPEDQGPQREPHNEWTLELLEELKNEAVRHFPRIWLHGLGQHIYETYGDTWAGVEAIIRILQQLLFIHFRIGCRHSRIGVTQQKRARNGASRS", @@ -185,21 +185,21 @@ { "name": "tat_exon1", "start": 5679, - "end": 5898, + "end": 5894, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ", - "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ*", - "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAA" + "aminoacids": "MEPVDPRLEPWKHPGSQPKTACTTCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRPPQDSQTHQVSLSKQ", + "nucleotides": "ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAAAACTGCTTGTACCACTTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATGACAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGACCTCCTCAAGACAGTCAGACTCATCAAGTTTCTCTATCAAAGCAG" }, { "name": "rev_exon1", "start": 5818, - "end": 5899, + "end": 5898, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4807692307692307, "protein": "MAGRSGDSDEDLLKTVRLIKFLYQSSK", @@ -209,9 +209,9 @@ { "name": "vpu", "start": 5910, - "end": 6156, + "end": 6155, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7333193453629878, "protein": "MQPIQIAIVALVVAIIIAIVV", @@ -221,9 +221,9 @@ { "name": "env", "start": 6070, - "end": 8656, + "end": 8655, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.1405525502318391, "protein": "MRVKEKCQHLWRWGWRWGTMLLGILMICSATEKLWVTVYYGVPVWKEATTTLFCASDAKAYDAEVHNVWATHACVPTDPNPQEVVLVNVTENFNMWKNDMVEQMHEDIISLWDQSLKPCVKLTPLCVSLKCTDLGNATNTNSSNTNSSSGEMMMEKGEIKNCSFNISTSIRNKVQKEYAFFYKLDIVPIDNDTTSYTLTSCNTSVITQACPKVSFEPIPIHYCAPAGFAILKCNNKTFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEDVVIRSANFTDNAKTIIVQLNQSVEINCTRPNNNTRKSIRIQRGPGRAFVTIGKIGNMRQAHCNISRAKWNATLKQIASKLREQFGNNKTIIFKQSSGGDPEIVTHSFNCGGEFFYCNSTQLFNSTWFNSTWSTEGSNNTEGSDTITLPCRIKQFINMWQEVGKAMYAPPISGQIRCSSNITGLLLTRDGGNNNNGSEIFRPGGGDMRDNWRSELYKYKVVKIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGAASMTLTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGIKQLQARILAVERYLKDQQLLGIWGCSGKLICTTAVPWNASWSNKSLEQIWNNMTWMEWDREINNYTSLIHSLIEESQNQQEKNEQELLELDKWASLWNWFNITNWLWYIKLFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTHLPNPGGPDRPEGIEEEGGERDRDRSIRLVNGSLALIWDDLRSLCLFSYHRLRDLLLIVTRIVELLGRRGWEALKYWWNLLQYWSQELKNSAVSLLNATAIAVAEGTDRVIEVVQGAYRAIRHIPRRIRQGLERILL", @@ -233,9 +233,9 @@ { "name": "tat_exon2", "start": 8237, - "end": 8333, + "end": 8332, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.6672629695885509, "protein": "RPTSQTRGDPTGPKE", @@ -245,9 +245,9 @@ { "name": "rev_exon2", "start": 8238, - "end": 8514, + "end": 8513, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.210025203024363, "protein": "DPPPKPGGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTILESGAKE", @@ -257,9 +257,9 @@ { "name": "nef", "start": 8657, - "end": 9278, + "end": 9277, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.06582796957284964, "protein": "MGGKWSKSSVIGWPTVRERMRRAEPAADGVGAASRDLEKHGAITSSNTAATNAACAWLEAQEEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQRRQDILDLWIYHTQGYFPDWQNYTPGPGIRYPLTFGWCYKLVPVEPDKVEEANKGENTSLLHPVSLHGMDDPEREVLEWRFDSRLAFHHVARELHPEYFKNC", @@ -271,9 +271,9 @@ { "name": "nef", "start": 0, - "end": 4059, + "end": 4058, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.7628009106462086, "protein": "MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ", @@ -283,9 +283,9 @@ { "name": "env", "start": 2, - "end": 4115, + "end": 4114, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.76033143808071, "protein": "MNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -295,9 +295,9 @@ { "name": "gag", "start": 789, - "end": 2292, + "end": 2291, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.19470123431286457, "protein": "MGARASVLSAGELDKWEKIRLRPGGKKKYRLKHIVWASRELERFAVNPGLLETSEGCRQILGQLQPSLQTGSEELRSLYNTIATLYCVHQKIEVKDTKEALEKVEEEQNKSKKKAQQAAADTGNNSQVSQNYPIVQNIQGQMVHQAISPRTLNAWVKVVEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIIMGLNKIVRMYSPTSILDIRQGPKEPFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQKGNFRNQKRNVKCFNCGKEGHIARNCRAPRKRGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPAQKQEPIDKELYPLASLRSLFGNDPSSQ", @@ -307,9 +307,9 @@ { "name": "pol", "start": 2084, - "end": 4115, + "end": 4114, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.5617851221088768, "protein": "FFREDLAFPQGKAREFPSEQTRANSPTRRELQVWGRDNNSRSEAGADRQGTVSFSFPQITLWQRPLVTIRIGGQLKEALLDTGADDTVLEEMNLPGRWKPKMIGGIGGFIKVRQYDQILIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLRKKKSVTVLDVGDAYFSVPLDKEFRKYTAFTIPSRNNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKQNPEIVIYQYMDDLYVGSDLEIGQHRIKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKDSWTVNDIQKLVGKLNWASQIYPGIKVRQLCKLLRGTKALTEIVPLTKEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYAKMRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -319,9 +319,9 @@ { "name": "vif", "start": 3617, - "end": 4115, + "end": 4114, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.7631664499349805, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -331,9 +331,9 @@ { "name": "vpr", "start": 3617, - "end": 4115, + "end": 4114, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.7629151983204618, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -343,9 +343,9 @@ { "name": "vpu", "start": 3617, - "end": 4115, + "end": 4114, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.7634058115037564, "protein": "MRGAHTNDVKQLTEAVQKITTESIVIWGKTPKFKLPIQKETWEAWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGAANRETKLGKAGYVTNRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDTQWRALRCCI", @@ -355,9 +355,9 @@ { "name": "tat_exon1", "start": 3823, - "end": 4084, + "end": 4083, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.7659115426105717, "protein": "MVPVRERTHSRSRNLLCRWGS", @@ -367,9 +367,9 @@ { "name": "rev_exon1", "start": 3823, - "end": 4084, + "end": 4083, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.7610789980732178, "protein": "MVPVRERTHSRSRNLLCRWGS", @@ -379,9 +379,9 @@ { "name": "tat_exon2", "start": 4080, - "end": 4164, + "end": 4163, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.769292994661058, "protein": "IPSGEPSDAAYKQLLFACTGSLWLDQI", @@ -391,9 +391,9 @@ { "name": "rev_exon2", "start": 4081, - "end": 4153, + "end": 4152, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.7667894365645325, "protein": "YPVASPQMLHISSCFLPVLGLSG", @@ -405,9 +405,9 @@ { "name": "gag", "start": 775, - "end": 2281, + "end": 2280, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.20784453738651432, "protein": "MGARASVLSGGKLDQWEKIRLRPGGKKKYQLKHIVWASKELERFAVNPGLLETTEGCRQILGQLQPSLQTGSEELKSLYNTVATLYCVHQRIDVKDTKEALDKIEEEQNKSKEKAKQAAADTGNSNQVSQNYPIVQNLQGQMVHQAISPRTLNAWVKVIEEKAFSPEVIPMFSALSEGATPQDLNTMLNTVGGHQAAMQMLKETINEEAAEWDRVHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTNNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIRQGPKESFRDYVDRFYKTLRAEQASQEVKNWMTETLLVQNSNPDCKTILKALGPGATLEEMMTACQGVGGPGHKARVLAEAMSQVTNSATIMMQRGNFRSQRKIVKCFNCGKEGHIARNCRAPRKKGCWKCGKEGHQMKDCTERQANFLGKIWPSHKGRPGNFLQSRPEPTAPPEESFRFGEETTTPSQKQESTGKELYPPLASLRSLFGNDPSSQ", @@ -417,9 +417,9 @@ { "name": "pol", "start": 2070, - "end": 5085, + "end": 5084, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.14843087362171337, "protein": "FFRENLAFPQGEARKFPSEQARANSPTRRELQVWGRDNNSLSEAGVDRQGTVSSFSFPQITLWQRPLVTIKIGGQLKEALLDTGADDTVLEEMSLPGRWKPKMIGGIGGFIKVRQYDQISIEICGHKAIGTVLVGPTPVNIIGRNLLTQIGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALTEICTEMEKEGKISKIGPENPYNTPVFAIKKKDSTKWRKLVDFRELNKRTQDFWEVQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDEDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQCSMTKILEPFRKQNPDIVIYQYMDDLYVGSDLEIGQHRTKIEELRQHLLRWGFTTPDKKHQKEPPFLWMGYELHPDKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGAKALTEVIPLTEEAELELAENREILKEPVHGVYYDPSKDLIAEIQKQGQGQWTYQIYQEPFKNLKTGKYARVRGAHTNDVKQLTEAVQKIATESIVIWGKTPKFRLPIQKETWETWWTEYWQATWIPEWEFVNTPPLVKLWYQLEKEPIVGAETFYVDGASNRETKLGKAGYVTDRGRQKVVSLTDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVNQIIEQLINKEKVYLAWVPAHKGIGGNEQVDKLVSTGIRKVLFLDGIDKAQEEHEKYHSNWRAMASDFNLPPVVAREIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEGKVILVAVHVASGYIEAEVIPAETGQETAYFLLKLAGRWPVKTIHTDNGSNFTSTTVKAACWWAGIKQEFGIPYNPQSQGVVESMNKELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATDIQTKELQKQITKIQNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKVKIIRDYGKQMAGDDCVASRQDED", @@ -429,9 +429,9 @@ { "name": "vif", "start": 5029, - "end": 5608, + "end": 5607, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.2608047690014903, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKHHMYVSGKAKGWFYRHHYESHHPRISSEVHVPLGDARLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPNLADQLIHLYYFDCFSESAIRSAILGHIVSPSCEYQAGHNKVGSLQYLALAALITPKRRKPPLPSVAKLTEDRWNKPQKTKGHRGSHIRNGH", @@ -441,9 +441,9 @@ { "name": "vpr", "start": 5547, - "end": 5838, + "end": 5837, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MEQAPEDQGPPREPYQEWTLELLEELKNEAVRHFPRMWLHGLGQHIYDTYGDTWTGVEAIIRILQQLLFIHFRIGCQHSRIGIIRQRRTRNGANRS", @@ -453,9 +453,9 @@ { "name": "tat_exon1", "start": 5818, - "end": 6037, + "end": 6036, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.28735632183908044, "protein": "MEPIDPRLEPWKHPGSQPKTACTSCYCKKCCFHCQVCFMTKALGISYGRKKRRQRRRASQDSQTHQVSLSKQ", @@ -465,9 +465,9 @@ { "name": "rev_exon1", "start": 5957, - "end": 6038, + "end": 6037, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.4274965800273598, "protein": "MAGRSGDSDEELLKTVRLIKFLYQSSK", @@ -477,9 +477,9 @@ { "name": "vpu", "start": 6049, - "end": 6298, + "end": 6297, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.520618556701031, "protein": "MNSLQISAIVAIVVAIILAIVVWSIVFIEYRKILRQRKIDRLIDRIRERAEDSGNESEGDQEELSTALMEMGHHAPWDVDDL", @@ -489,9 +489,9 @@ { "name": "env", "start": 6212, - "end": 8783, + "end": 8782, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.4766895145301081, "protein": "MRVKGIRKNYQQHLWRWGTMLLGMLMICSAAGNLWVTVYYGVPVWKEATTTLFCASDAKAYGTEVHNVWATHACVPTDPNPQEVRLENVTENFNMWRNPMVEQMHEDIISLWDQSLKPCVKLTPLCVTLNCTDLGQESTNNNITGSIEKGEMKNCSFNISSSKGSKGHKEYASFYKLDVVPIGNNKTNGNYSSYRLISCNTSVITQACPKVSFEPIPIHFCAPAGYAILKCNDKQFNGTGPCTNVSTVQCTHGIRPVVSTQLLLNGSLAEEEVVIRSANFTDNAKTIIVQLNQSVEITCTRPGNNTIRGVHMGPGKAFYAGAITGDIRKAHCIINKAKWNSTLRLVVAKLSEQFRNKTINFTQPSGGDPEIVTHSFNCGGEFFYCNTTKLFNSTWNATHMINGTWNDTEGNITLPCRIKQIINMWQEVGKAMYAPPIRGQIRCSSNITGLLLTRDGGKTNESNTTEIFRPGGGDMRDNWRSELYKYKVVRIEPLGVAPTKAKRRVVQREKRAVGIGALFLGFLGAAGSTMGATSMALTVQARQLLSGIVQQQNNLLRAIEAQQHLLQLTVWGVKQLQARVLALERYLKDQQLLGFWGCSGKLICTTDVPWNASWSNKSLGQIWENMTWMEWEREIDNYTSLIYTLITESQIQQEQNEKELLELDKWANLWNWFGITNWLWYIKIFIMIVGGLVGLRIVFAVLSIVNRVRQGYSPLSFQTRFPAPRGPDRPEGIEEEGGERDRDRSAPLVKGFLALIWVDLRSLCLFSYHRLRDLLLIITRIVELLGRRGWEVLKYLWSLLQYWTQELKNSAVSLLNATAIAVAEGTDRIIEVLQRVFRAILHIPTRIRQGFERALL", @@ -501,9 +501,9 @@ { "name": "tat_exon2", "start": 8364, - "end": 8460, + "end": 8459, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.3921568627450981, "protein": "RPASQPRGDPTGPKESKKKVERETETDPLH", @@ -513,9 +513,9 @@ { "name": "rev_exon2", "start": 8365, - "end": 8641, + "end": 8640, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.29843322556577967, "protein": "DPLPSPEGTRQARRNRRRRWRERQRQIRSISERILSTYLGRSTEPVPLQLPPLERLTLDNNEDCGTSGTQGVGSPQILVESPTVLDTGTKE", @@ -525,9 +525,9 @@ { "name": "nef", "start": 8784, - "end": 9387, + "end": 9386, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.3966849799795139, "protein": "MGGKWSKSSLVGWPNVRERMRRAEPAADGVGAVSRDLERHGAITSSNTATNNADCAWLEAQKEEEVGFPVTPQVPLRPMTYKAAVDLSHFLKEKGGLEGLIHSQKRQDILDLWIYHTQGYFPDWQNYTPGPGVRYPLTFGWCFKLVPVEPTDRENDRLLHPASLQGMEDPEGEVLEWRFDSRLAFHHMARELHPEYYKNC", @@ -539,9 +539,9 @@ { "name": "gag", "start": 315, - "end": 1665, + "end": 1664, "subtype_start": 789, - "subtype_end": 2292, + "subtype_end": 2291, "orientation": "forward", "distance": 0.596665989022159, "protein": "MAYSPVAAPRLLPCALQQATPQDLNTMLNTVGGHQAAMQMLKEVINEEAAEWDRLHPVHAGPIAPGQMREPRGSDIAGTTSTLQEQIGWMTHNPPIPVGEIYKRWIILGLNKIVRMYSPTSILDIKQGPKEPFRDYVDRFYKTLRAEQATQEVKNWMTETLLVQNANPDCKTILKALGPAATLEEMMTACQGVGGPGHKARVLAEAMSQATGTANILMQRGNFRNQRKPVKCFNCGKEGHIAKNCRAPRKKGCWKCGREGHQMKDCTERQANFLGKIWPSHKGRPGNFPQSRPEIPQSRPEPTAPPAPPEESFRFGEATTPSQKQETMDKELYPPLTSLRSLFGNDPSSQ", @@ -551,9 +551,9 @@ { "name": "pol", "start": 1427, - "end": 4469, + "end": 4468, "subtype_start": 2084, - "subtype_end": 5096, + "subtype_end": 5095, "orientation": "forward", "distance": 0.27887169154684477, "protein": "FFRENLAFSQGKARELSSEPTRNSSEQTRANSPTSPSRRELQVWGSNNSLSEAGDNGQGAVSSSNFPQITLWQRPIVTIKIGGQLKEALLDTGADDTVLEDIDLPGKWKPKMIGGIGGFIKVRQYEQVPIEISGHKAIGTVLVGPTPVNIIGRNLLTQLGCTLNFPISPIETVPVKLKPGMDGPKVKQWPLTEEKIKALVEICTEMEKEGKISKIGPENPYNTPVFAIKKKDGTKWRKLVDFRELNKRTQEFWEIQLGIPHPAGLKKKKSVTVLDVGDAYFSVPLDKDFRKYTAFTIPSINNETPGIRYQYNVLPQGWKGSPAIFQSSMTKILEPFRKTNPDIVIYQYMDDLYVGSDLEIGQHRTKVEELRQHLMRWGFTTPDKKHQKEPPFLWMGYELHPNKWTVQPIVLPEKESWTVNDIQKLVGKLNWASQIYAGIKVKQLCKLLRGTKALTEVVPLTEEAELELAENREILKDPVHGAYYDPAKDLIAELQKQGEGQWTYQIYQEPFKNLKTGKYARTRGAHTNDVKQLTEAVQKISTESIVIWGRTPKFRLPIQKETWETWWTDYWQATWIPEWEFVNTPPLVKLWYQLEKEPIIGAETFYVDGAANRDNKSGKAGYVTDRGRQKVVTINDTTNQKTELQAIHLALQDSGLEVNIVTDSQYALGIIQAQPDKSESELVSQIIEQLIKKEKVYLAWVPAHKGIGGNEQVDKLVSAGIRKVLFLDGIEKAQEDHEKYHSNWRTMASDFNLPPIVAKEIVASCDKCQLKGEAMHGQVDCSPGIWQLDCTHLEEKIILVAVHVASGYIEAEVIPAETGQETAYFILKLAGRWPVKTIHTDNGRNFTSNTVKAACWWAGIKQEFGIPYNPQSQGVVESMNNELKKIIGQVRDQAEHLKTAVQMAVFIHNFKRKGGIGGYSAGERIVDIIATEIQTKELQKQITKIPNFRVYYRDSRDPLWKGPAKLLWKGEGAVVIQDNSDIKVVPRRKAKIIRDYGKQMAGDDCVASRQDED", @@ -563,9 +563,9 @@ { "name": "vif", "start": 4413, - "end": 4992, + "end": 4991, "subtype_start": 5040, - "subtype_end": 5619, + "subtype_end": 5618, "orientation": "forward", "distance": 0.3566796368352788, "protein": "MENRWQVMIVWQVDRMRIRTWKSLVKYHMYISKKAKKWAYRHHYETTHPRISSEVHIPLGDDRLVITTYWGLHTGERDWHLGQGVSIEWRKRRYSTQVDPDLADHLIHVHYFDCFSESAIRNAILGHRVSPRCEYQAGHNKVGSLQYLALTAVITPKKIKPPLPSVKKLTEDRWNKPQKTKGHRESHTMNGH", @@ -575,9 +575,9 @@ { "name": "vpr", "start": 4931, - "end": 5222, + "end": 5221, "subtype_start": 5558, - "subtype_end": 5849, + "subtype_end": 5848, "orientation": "forward", "distance": 0.3808935556928146, "protein": "MEQAPEDQGPQREPYNEWTLELLEELKREAVRHFPRPWLQDLGQYIYETYGDTWTGVEAIIRILQQMLFIHFRIGCHHSRIGIVLQRRARNGASRS", @@ -587,21 +587,21 @@ { "name": "tat_exon1", "start": 5202, - "end": 5421, + "end": 5417, "subtype_start": 5829, - "subtype_end": 6045, + "subtype_end": 6044, "orientation": "forward", "distance": 0.40192926045016075, "protein": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", - "aminoacids": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ*", - "nucleotides": "ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAGTAA" + "aminoacids": "MEPVDHRLEPWKHPGSQPRTPCTNCYCKKCCFHCQVCFIQKALGISYGRKKRRQRRRSPQDSQTHQVPLPKQ", + "nucleotides": "ATGGAGCCAGTAGATCATAGACTAGAGCCCTGGAAGCATCCAGGAAGTCAGCCTAGGACTCCTTGTACCAATTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTGTGTTTTATACAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGAGACGAAGATCTCCTCAAGACAGTCAGACTCATCAAGTTCCTCTACCAAAGCAG" }, { "name": "rev_exon1", "start": 5341, - "end": 5422, + "end": 5421, "subtype_start": 5968, - "subtype_end": 6046, + "subtype_end": 6045, "orientation": "forward", "distance": 0.524971623155505, "protein": "MAGRSGDRDEDLLKTVRLIKFLYQSSK", @@ -611,9 +611,9 @@ { "name": "vpu", "start": 5433, - "end": 5682, + "end": 5681, "subtype_start": 6060, - "subtype_end": 6309, + "subtype_end": 6308, "orientation": "forward", "distance": 0.5244381020335356, "protein": "MQSLEILAIVALVVAAIIAIVVWTIVGIEYRKILRQRKIDKIINRIRERAEDSGNESEGDQEELSALVVEMGHDAPWDVDDL", @@ -623,9 +623,9 @@ { "name": "env", "start": 5596, - "end": 8158, + "end": 8157, "subtype_start": 6223, - "subtype_end": 8794, + "subtype_end": 8793, "orientation": "forward", "distance": 0.5152420275849952, "protein": "MRAKGIRKNCQHLWWKWGTMLLGMLMICSAAENLWVTVYYGVPVWRDANTTLFCASDAKAYDTEVHNVWATHACVPTDPNPHEVELKNVTENFNMWKNNMVDQMHEDIINLWDQSLKPCAKLTPLCVTLNCTDLRNDTVGNQTNLTETNTIQGREMTNCSFNITTEIRDKVRKEHALFYKLDVMPIDRDNTSYTLINCNTSVITQACPKVTFEPIPIHYCTPAGFAILKCKDEMFNGTGPCKNVSTVQCTHGIRPVVSTQLLLNGSLAEKEIVLRSENFTDNGKNIIVQLNRSIVINCTRPNNNTRKSISVAGRAIYATGQIIGDIRQAHCNISETDWNDTLSKIVEKLREKFGKDKTIIFNQSSGGDMEIETHSFNCGGEFFYCNTTRLFNSTWSVNGTSINGTKNITLPCRIKQIINRWQEVGKAMYAPPISGIIRCSSNITGLILTRDGGTNNSTEETETFRPGGGNMKDNWRSELYKYKVVKIEPLGVAPTKAQRRVVQREKRAIGALGAMFLGFLGAAGSTMGAASLTLTVQARQLLSGIVQQQNNLLRAIEAQQHMLQLTVWGIKQLQARVLSVERYLQDQQLLGIWGCSGKLICTTTVPWNTSWSNKSYDTIWDNMTWMQWDREIQNYTGKIYNLLEESQIQQEKNEKELLELDQWANLWNWFSITKWLWYIKIFIMIVGGLVGLKIIFAVFSIVNRVRQGYSPLSLQTLLPTPRGPDRPEGIEEEGGERDRGRSGRLVTGFLPLIWDDLRSLCLFSYHHLRDLLLIVLRTVQVLGHRGWEILKYWWSLLQYWIQELKNSAVSLLNTIAIAVAEGTDRVIEVGQRIGRAFLHIPRRIRQGLERALQ", @@ -635,9 +635,9 @@ { "name": "tat_exon2", "start": 7739, - "end": 7835, + "end": 7834, "subtype_start": 8375, - "subtype_end": 8471, + "subtype_end": 8470, "orientation": "forward", "distance": 0.6842105263157894, "protein": "RPSSQPRGDQTGPKE", @@ -647,9 +647,9 @@ { "name": "rev_exon2", "start": 7740, - "end": 8016, + "end": 8015, "subtype_start": 8376, - "subtype_end": 8652, + "subtype_end": 8651, "orientation": "forward", "distance": 0.4267425320056898, "protein": "DPPPNPEGTRQARRNRRRRWRERQRQIRKISDWILTTHLGRPAEPVPLQLPPLERLTLDCAEDCASSGTQGVGDPQVLVESPAVLDSGTKE", @@ -659,9 +659,9 @@ { "name": "nef", "start": 8159, - "end": 8813, + "end": 8812, "subtype_start": 8795, - "subtype_end": 9416, + "subtype_end": 9415, "orientation": "forward", "distance": 0.4891015417331206, "protein": "MGGKWSKGCMAGWPTVRERMERIDPRPAARREQAEPAAAGVGAASRDLEKYGAITSSNTSTTNAACAWLEAQEEEEVGFPVRPQVPLRPMTYKAALDLSHFLKEKGGLEGLIWSQRRQEILDLWVYHTQGYFPDWQNYTPGPGVRFPLTFGWCFKLVPVDPDQVEKANEGENNCLLHPMSLHGMEDSEGEVLMWKFDSSLAFHHRAREQHPEYYKDC", diff --git a/util/find_orf.py b/util/find_orf.py index fbfb8f5..7248828 100644 --- a/util/find_orf.py +++ b/util/find_orf.py @@ -52,7 +52,7 @@ def find_candidate_positions(aligned_sequence, e): visited_set.add(got_aminoacids) closest_start = (closest_start_a * 3) + frame - closest_end = (closest_end_a * 3) + 3 + frame + closest_end = (closest_end_a * 3) + 3 + frame - 1 got_protein = get_biggest_protein(has_start_codon(e), got_aminoacids) dist = detailed_aligner.align(got_protein, expected_protein).distance() orf = OriginalORF(