diff --git a/intact/intact.py b/intact/intact.py index 5085fd7..2b356b2 100644 --- a/intact/intact.py +++ b/intact/intact.py @@ -21,6 +21,7 @@ MISPLACEDORF_ERROR = "MisplacedORF" LONGDELETION_ERROR = "LongDeletion" DELETIONINORF_ERROR = "DeletionInOrf" +INSERTIONINORF_ERROR = "InsertionInOrf" INTERNALSTOP_ERROR = "InternalStopInOrf" SCRAMBLE_ERROR = "Scramble" NONHIV_ERROR = "NonHIV" @@ -600,10 +601,6 @@ def small_frames( aligner = Align.PairwiseAligner() aligner.mode = 'global' - aligner.match_score = 2 - aligner.mismatch_score = -1 - aligner.open_gap_score = -0.5 - aligner.extend_gap_score = -0.1 def translate(seq, frame = 0, to_stop = False): for_translation = seq[frame:] @@ -659,13 +656,43 @@ def find_real_correspondence(e): candidates = list(find_candidate_positions(e, q_start, q_end)) return min(candidates, key=lambda x: x.distance) + def get_indel_impact(alignment): + shift = 0 + impacted = 0 + counter = 0 + good = 0 + for (x, y) in zip(alignment[0], alignment[1]): + if x == "-" and y == "-": + continue + if x == "-" and y != "-": + shift += 1 + if x != "-" and y == "-": + shift -= 1 + if shift % 3 != 0: + counter += 1 + good = 0 + else: + good += 1 + if good > 5: + impacted += counter if counter > 30 else 0 + counter = 0 + + impacted += counter if counter > 30 else 0 + return impacted + errors = [] for e in expected: best_match = find_real_correspondence(e) got_protein = best_match.aminoseq.split("*")[0] exp_protein = best_match.expectedaminoseq.split("*")[0] + + got_nucleotides = sequence.seq[best_match.start:best_match.start + len(got_protein) * 3] + exp_nucleotides = reference[e.start:e.end].upper() + orf_alignment = aligner.align(exp_nucleotides, got_nucleotides)[0] + deletions = (len(exp_protein) - len(got_protein)) * 3 + insertions = (len(got_protein) - len(exp_protein)) * 3 # Max deletion allowed in ORF exceeded if deletions > e.deletion_tolerence: @@ -687,25 +714,37 @@ def find_real_correspondence(e): + str(deletions) )) - got_nucleotides = sequence.seq[best_match.start:best_match.start + len(got_protein) * 3] - exp_nucleotides = reference[e.start:e.end].upper() + continue - alignment = aligner.align(exp_nucleotides, got_nucleotides)[0] + # Max insertions allowed in ORF exceeded + if insertions > 3 * e.deletion_tolerence: - insertions = len(re.findall(r"-", str(alignment[0]))) - deletions = len(re.findall(r"-", str(alignment[1]))) + errors.append(IntactnessError( + sequence.id, INSERTIONINORF_ERROR, + "Smaller ORF " + str(e.name) + " at " + str(e.start) + + "-" + str(e.end) + + " can have maximum insertions " + + str(3 * e.deletion_tolerence) + ", got " + + str(insertions) + )) + + continue + + impacted_by_indels = get_indel_impact(orf_alignment) # Check for frameshift in ORF - if (deletions - insertions) % 3 != 0: + if impacted_by_indels >= e.deletion_tolerence + 0.10 * len(exp_nucleotides): errors.append(IntactnessError( sequence.id, FRAMESHIFTINORF_ERROR, "Smaller ORF " + str(e.name) + " at " + str(e.start) + "-" + str(e.end) - + " contains an out of frame indel: insertions " + str(insertions) - + " deletions " + str(deletions) + "." + + " contains out of frame indels that impact " + str(impacted_by_indels) + + " positions." )) + continue + return errors diff --git a/tests/expected-results-large/errors.json b/tests/expected-results-large/errors.json index 8363047..362b826 100644 --- a/tests/expected-results-large/errors.json +++ b/tests/expected-results-large/errors.json @@ -20,11 +20,6 @@ "error": "DeletionInOrf", "message": "Smaller ORF tat_exon1 at 5829-6044 can have maximum deletions 30, got 213" }, - { - "sequence_name": "KX505501.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 0 deletions 212." - }, { "sequence_name": "KX505501.1", "error": "DeletionInOrf", @@ -32,13 +27,13 @@ }, { "sequence_name": "KX505501.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 0 deletions 73." + "error": "InternalStopInOrf", + "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon" }, { "sequence_name": "KX505501.1", - "error": "InternalStopInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon" + "error": "FrameshiftInOrf", + "message": "Smaller ORF tat_exon2 at 8375-8468 contains out of frame indels that impact 80 positions." }, { "sequence_name": "KX505501.1", @@ -67,16 +62,6 @@ } ], "MN691959": [ - { - "sequence_name": "MN691959", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 2 deletions 1." - }, - { - "sequence_name": "MN691959", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 3 deletions 1." - }, { "sequence_name": "MN691959", "error": "InternalStopInOrf", @@ -99,6 +84,11 @@ "error": "DeletionInOrf", "message": "Smaller ORF vif at 5040-5619 can have maximum deletions 30, got 81" }, + { + "sequence_name": "MN692074", + "error": "InsertionInOrf", + "message": "Smaller ORF vpr at 5558-5849 can have maximum insertions 90, got 207" + }, { "sequence_name": "MN692074", "error": "InternalStopInOrf", @@ -107,12 +97,17 @@ { "sequence_name": "MN692074", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 1 deletions 153." + "message": "Smaller ORF rev_exon1 at 5968-6044 contains out of frame indels that impact 51 positions." + }, + { + "sequence_name": "MN692074", + "error": "InsertionInOrf", + "message": "Smaller ORF vpu at 6060-6309 can have maximum insertions 90, got 249" }, { "sequence_name": "MN692074", "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 18 deletions 31." + "message": "Smaller ORF tat_exon2 at 8375-8468 contains out of frame indels that impact 81 positions." }, { "sequence_name": "MN692074", @@ -135,18 +130,7 @@ "message": "Query sequence contains a long deletion." } ], - "MN692145": [ - { - "sequence_name": "MN692145", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 5 deletions 4." - }, - { - "sequence_name": "MN692145", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 7 deletions 2." - } - ], + "MN692145": [], "MN090335": [ { "sequence_name": "MN090335", @@ -163,16 +147,6 @@ "error": "FrameshiftInOrf", "message": "ORF gag at 1175-2291 contains an out of frame indel, deletions 91 insertions 33." }, - { - "sequence_name": "MN090335", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 7 deletions 6." - }, - { - "sequence_name": "MN090335", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - }, { "sequence_name": "MN090335", "error": "InternalStopInOrf", @@ -205,16 +179,6 @@ "error": "WrongORFNumber", "message": "Expected 3 forward ORFs, got 2" }, - { - "sequence_name": "MN090376", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 18 deletions 17." - }, - { - "sequence_name": "MN090376", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 9 deletions 7." - }, { "sequence_name": "MN090376", "error": "PackagingSignalDeletion", @@ -236,29 +200,8 @@ "message": "Sequence contains an internal inversion." } ], - "MK115581.1": [ - { - "sequence_name": "MK115581.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115581.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - } - ], + "MK115581.1": [], "MK115690.1": [ - { - "sequence_name": "MK115690.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 5 deletions 4." - }, - { - "sequence_name": "MK115690.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 5 deletions 3." - }, { "sequence_name": "MK115690.1", "error": "PackagingSignalDeletion", @@ -271,16 +214,6 @@ } ], "MK115571.1": [ - { - "sequence_name": "MK115571.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115571.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - }, { "sequence_name": "MK115571.1", "error": "PackagingSignalDeletion", @@ -293,16 +226,6 @@ } ], "MK115514.1": [ - { - "sequence_name": "MK115514.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115514.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - }, { "sequence_name": "MK115514.1", "error": "MajorSpliceDonorSiteMutated", @@ -310,16 +233,6 @@ } ], "MK115488.1": [ - { - "sequence_name": "MK115488.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115488.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - }, { "sequence_name": "MK115488.1", "error": "MajorSpliceDonorSiteMutated", @@ -332,16 +245,6 @@ "error": "MisplacedORF", "message": "Expected an ORF, gag, at 789-2292 in the forward strand, got 765-2282" }, - { - "sequence_name": "MK115030.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 11 deletions 10." - }, - { - "sequence_name": "MK115030.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 7 deletions 5." - }, { "sequence_name": "MK115030.1", "error": "Scramble", @@ -353,18 +256,7 @@ "message": "Sequence contains an internal inversion." } ], - "MK115498.1": [ - { - "sequence_name": "MK115498.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115498.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - } - ], + "MK115498.1": [], "MK115211.1": [ { "sequence_name": "MK115211.1", @@ -376,16 +268,6 @@ "error": "MisplacedORF", "message": "Expected an ORF, env, at 6223-8794 in the forward strand, got 6955-8793" }, - { - "sequence_name": "MK115211.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 13 deletions 12." - }, - { - "sequence_name": "MK115211.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 12 deletions 7." - }, { "sequence_name": "MK115211.1", "error": "PackagingSignalDeletion", @@ -418,16 +300,6 @@ "error": "FrameshiftInOrf", "message": "ORF gag at 709-2282 contains an out of frame indel, deletions 20 insertions 0." }, - { - "sequence_name": "MK115158.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 17 deletions 16." - }, - { - "sequence_name": "MK115158.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 12 deletions 7." - }, { "sequence_name": "MK115158.1", "error": "PackagingSignalDeletion", @@ -440,16 +312,6 @@ } ], "MK114705.1": [ - { - "sequence_name": "MK114705.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 13 deletions 12." - }, - { - "sequence_name": "MK114705.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 11 deletions 6." - }, { "sequence_name": "MK114705.1", "error": "InternalStopInOrf", @@ -482,16 +344,6 @@ "error": "InternalStopInOrf", "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon" }, - { - "sequence_name": "MK114856.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 0 deletions 185." - }, - { - "sequence_name": "MK114856.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - }, { "sequence_name": "MK114856.1", "error": "InternalStopInOrf", @@ -539,16 +391,6 @@ "error": "DeletionInOrf", "message": "Smaller ORF tat_exon1 at 5829-6044 can have maximum deletions 30, got 54" }, - { - "sequence_name": "MK115009.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 9 deletions 62." - }, - { - "sequence_name": "MK115009.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 7 deletions 5." - }, { "sequence_name": "MK115009.1", "error": "InternalStopInOrf", @@ -576,50 +418,19 @@ } ], "MK115387.1": [ - { - "sequence_name": "MK115387.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 4 deletions 3." - }, - { - "sequence_name": "MK115387.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 8 deletions 3." - }, { "sequence_name": "MK115387.1", "error": "InternalStopInOrf", "message": "Smaller ORF tat_exon2 at 8375-8468 contains an internal stop codon" } ], - "MK115491.1": [ - { - "sequence_name": "MK115491.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115491.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - } - ], + "MK115491.1": [], "MK116110.1": [ { "sequence_name": "MK116110.1", "error": "WrongORFNumber", "message": "Expected 3 forward ORFs, got 2" }, - { - "sequence_name": "MK116110.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 9 deletions 8." - }, - { - "sequence_name": "MK116110.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 8 deletions 6." - }, { "sequence_name": "MK116110.1", "error": "PackagingSignalDeletion", @@ -636,47 +447,15 @@ "message": "Sequence contains an internal inversion." } ], - "MK115527.1": [ - { - "sequence_name": "MK115527.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115527.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - } - ], + "MK115527.1": [], "MK114997.1": [ { "sequence_name": "MK114997.1", "error": "WrongORFNumber", "message": "Expected 3 forward ORFs, got 4" - }, - { - "sequence_name": "MK114997.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 13 deletions 12." - }, - { - "sequence_name": "MK114997.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 7 deletions 5." - } - ], - "MK115518.1": [ - { - "sequence_name": "MK115518.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115518.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 7 deletions 2." } ], + "MK115518.1": [], "MK115065.1": [ { "sequence_name": "MK115065.1", @@ -688,16 +467,6 @@ "error": "DeletionInOrf", "message": "ORF gag at 657-2282 can have maximum deletions 30, got 75" }, - { - "sequence_name": "MK115065.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 11 deletions 10." - }, - { - "sequence_name": "MK115065.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 7 deletions 5." - }, { "sequence_name": "MK115065.1", "error": "PackagingSignalDeletion", @@ -735,16 +504,6 @@ "error": "InternalStopInOrf", "message": "Smaller ORF tat_exon1 at 5829-6044 contains an internal stop codon" }, - { - "sequence_name": "MK115464.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 0 deletions 194." - }, - { - "sequence_name": "MK115464.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 5 deletions 3." - }, { "sequence_name": "MK115464.1", "error": "InternalStopInOrf", @@ -771,34 +530,13 @@ "message": "Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 4.937891251407691e-23)." } ], - "MK115530.1": [ - { - "sequence_name": "MK115530.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115530.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - } - ], + "MK115530.1": [], "MK115520.1": [ { "sequence_name": "MK115520.1", "error": "WrongORFNumber", "message": "Expected 3 forward ORFs, got 4" }, - { - "sequence_name": "MK115520.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115520.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 7 deletions 2." - }, { "sequence_name": "MK115520.1", "error": "MajorSpliceDonorSiteMutated", @@ -810,29 +548,8 @@ "message": "Sequence contains an internal inversion." } ], - "MK115503.1": [ - { - "sequence_name": "MK115503.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115503.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 7 deletions 2." - } - ], + "MK115503.1": [], "MK115570.1": [ - { - "sequence_name": "MK115570.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115570.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - }, { "sequence_name": "MK115570.1", "error": "PackagingSignalDeletion", @@ -844,18 +561,7 @@ "message": "Query sequence has a missing splice donor site, --." } ], - "MK115509.1": [ - { - "sequence_name": "MK115509.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115509.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - } - ], + "MK115509.1": [], "MK115702.1": [ { "sequence_name": "MK115702.1", @@ -872,16 +578,6 @@ "error": "FrameshiftInOrf", "message": "ORF env at 6199-8764 contains an out of frame indel, deletions 50 insertions 37." }, - { - "sequence_name": "MK115702.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 12 deletions 11." - }, - { - "sequence_name": "MK115702.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 10 deletions 8." - }, { "sequence_name": "MK115702.1", "error": "PackagingSignalDeletion", @@ -919,16 +615,6 @@ "error": "DeletionInOrf", "message": "Smaller ORF tat_exon1 at 5829-6044 can have maximum deletions 30, got 54" }, - { - "sequence_name": "MK115095.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 8 deletions 61." - }, - { - "sequence_name": "MK115095.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 7 deletions 5." - }, { "sequence_name": "MK115095.1", "error": "InternalStopInOrf", @@ -950,41 +636,9 @@ "message": "Query sequence shows evidence of APOBEC3F/G-mediated hypermutation (p = 8.33506116803153e-40)." } ], - "MK115490.1": [ - { - "sequence_name": "MK115490.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115490.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - } - ], - "MK115576.1": [ - { - "sequence_name": "MK115576.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "MK115576.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - } - ], + "MK115490.1": [], + "MK115576.1": [], "OQ092466": [ - { - "sequence_name": "OQ092466", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 6 deletions 5." - }, - { - "sequence_name": "OQ092466", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 5 deletions 3." - }, { "sequence_name": "OQ092466", "error": "MajorSpliceDonorSiteMutated", @@ -992,16 +646,6 @@ } ], "OQ092463": [ - { - "sequence_name": "OQ092463", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 8 deletions 7." - }, - { - "sequence_name": "OQ092463", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 3 deletions 1." - }, { "sequence_name": "OQ092463", "error": "PackagingSignalDeletion", @@ -1014,16 +658,6 @@ } ], "OQ092465": [ - { - "sequence_name": "OQ092465", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 8 deletions 7." - }, - { - "sequence_name": "OQ092465", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 3 deletions 1." - }, { "sequence_name": "OQ092465", "error": "MajorSpliceDonorSiteMutated", @@ -1031,16 +665,6 @@ } ], "OQ092462": [ - { - "sequence_name": "OQ092462", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 6 deletions 5." - }, - { - "sequence_name": "OQ092462", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 5 deletions 3." - }, { "sequence_name": "OQ092462", "error": "PackagingSignalDeletion", @@ -1053,16 +677,6 @@ } ], "OQ092464": [ - { - "sequence_name": "OQ092464", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 8 deletions 7." - }, - { - "sequence_name": "OQ092464", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 3 deletions 1." - }, { "sequence_name": "OQ092464", "error": "PackagingSignalDeletion", @@ -1075,16 +689,6 @@ } ], "OQ092467": [ - { - "sequence_name": "OQ092467", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 3 deletions 2." - }, - { - "sequence_name": "OQ092467", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 7 deletions 2." - }, { "sequence_name": "OQ092467", "error": "PackagingSignalDeletion", diff --git a/tests/expected-results-large/intact.fasta b/tests/expected-results-large/intact.fasta index e69de29..2d494f4 100644 --- a/tests/expected-results-large/intact.fasta +++ b/tests/expected-results-large/intact.fasta @@ -0,0 +1,1754 @@ +>MN692145 +TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA +CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC +TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA +GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT +GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT +ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG +AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT +GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC +TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG +TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG +TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG +AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC +GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG +TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG +GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA +ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG +ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT +AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA +TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC +AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT +GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA +GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA +AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA +AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC +TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC +CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA +TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT +TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA +AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT +GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC +ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT +CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA +TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC +CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA +AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA +GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG +CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA +ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA +AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA +GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT +ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG +ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT +GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA +GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA +ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT +CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA +GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA +CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA +TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT +ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA +GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA +AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA +ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT +ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC +CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC +AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC +AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA +CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA +CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA +GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT +GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA +ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA +AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG +GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA +GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA +GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT +CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC +ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA +TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA +TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT +GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA +TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA +GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA +GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG +GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA +CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT +ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG +ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG +AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA +GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC +AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA +AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT +TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT +AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG +ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT +AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA +TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT +GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG +AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA +CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT +ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC +TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC +TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG +AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT +AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG +GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT +TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT +GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC +TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA +AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA +CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT +ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC +TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA +TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT +ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG +CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA +CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG +CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA +CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA +GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA +ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG +GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG +AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA +ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA +AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA +AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT +GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG +AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC +AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG +TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG +CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT +TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG +AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC +TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG +GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA +AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT +TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC +CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA +GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA +AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA +TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC +AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG +TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC +AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT +GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG +AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC +AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT +GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG +GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC +AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC +CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC +GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT +GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA +GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA +TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG +GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA +TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA +GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT +GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT +CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA +GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA +TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG +GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC +AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA +GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG +CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG +GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG +CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG +GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT +GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC +CTTTTAGTCAGTGTGGAAAATCTCTAGCA +>MK115581.1 +AAATTGGGACGTTCGCCTACGCAAGCGAAAATTTCTCTACGTAGCCACCTTTCCCGATTA +ACGTCAGAACCCTAAAATTAAAATAAATCCTAGCGGCCGACCGACTCTGGTAACTAGAGA +TCCCTCAAAGATAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCC +TCAGATTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACA +GACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCGAATCATCTT +AGAGTGGCGCCCGAACGACTCTGGTAACTAGAGATCCCTCAAAGATAAATCTCTAGCAGT +GGCGCCCGCGACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCG +AGACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCGAACAGACT +CTGGTAACTAGAGATCCCTCAAAGATAAATCTCTAGCAGTGGCGCCCGACACAGGTACTA +GAGAAAGCGAAAGTAAAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCG +CGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAG +CGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAG +ATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATT +TAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACAT +CAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAG +AACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGG +TACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAA +AGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCA +TAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATG +CATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAG +CATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGAC +ATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATA +GATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAA +GTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATC +CACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAG +TAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTA +GAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAA +AAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTT +TAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGG +GGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTA +ATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATT +GTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGA +AATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAG +GGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGC +CAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGA +AGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCA +GCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGG +AGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGAT +AGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTG +TGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAG +AAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGT +ACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGA +AGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTC +AAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAG +TACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTG +GGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGT +ACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATAC +TGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGT +GCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTT +AGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTA +TGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACA +TCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCT +TTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGA +AAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAG +TCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGC +ACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGA +AATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGA +AGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAA +TCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATT +AACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAA +ATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGC +CACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCA +ATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAG +AGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTC +CCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGA +TTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGC +ACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAA +GGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGT +AGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGC +CCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATAT +ACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGA +GGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCT +AGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGT +TATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATG +GCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGC +CGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCA +AGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCA +GGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAA +AGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCT +ACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAG +GGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGC +AGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCAT +TAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGA +TTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGAT +GGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCC +CACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAG +AATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAG +TTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAAT +CTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAG +GACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGA +GAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACC +AGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGA +ACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACA +TATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCA +ACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCC +ACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAG +GAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCC +AAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGC +GACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAG +TATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAA +TAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAA +GGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTG +AAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATG +TTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTA +TGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAG +GCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTA +GGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATG +CATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCA +CTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAG +GAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGA +AATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAAT +GATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCA +AAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTA +AAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAA +TGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCA +GAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTA +CATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGT +ATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGA +CAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAA +AAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGAC +CCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACA +CAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGA +AACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAA +GCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTA +CTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGA +GATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCA +TTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTG +GGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCG +TCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAAC +AATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATC +AAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTG +GGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGT +TGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGA +GAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAG +GAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTT +AACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATA +GGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCA +CCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATC +GAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTG +GCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGAC +TTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTC +AAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGC +TTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTA +CAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGG +GCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGT +AAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGA +CCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGC +CTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCC +TTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGG +GGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTA +CAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATA +TCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCA +AGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAA +AGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAA +GCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTG +GGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGC +TGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGC +CTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTG +CACTCAAGGCAAGCT +>MK115498.1 +AACACGGAATGGGAGATAAGCAGCATCTCTATCGGCGCGGCGAGATCTGACACTGGTAAC +TAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATC +CCTCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCCTAAATCTC +TAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTG +GCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCC +TCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACAGAC +TCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAA +CTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGGACTCTGGTAACTAGAGATCCCT +CACCCTAGATCTCTAGCAGTGGCGCCCGCGAAGGCACTAGGACCTGAAAGCGAAAGTAAA +ACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGA +GGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGA +GAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATT +CGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGG +GAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAA +ATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTT +AATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAA +GCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCA +GCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAG +GGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTA +GAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCC +ACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAA +ATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCAT +GCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACT +ACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGA +GAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCT +ACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGG +TTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAA +ACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCA +GCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAA +GCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGA +GGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCAC +ATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGA +CATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCC +CACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAA +GAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGAC +AAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAA +TAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTAT +TAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTT +TTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAG +GTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGC +TTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGC +CAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCAT +TAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAA +ATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAAT +TAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAA +TACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATG +CATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTA +GTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGA +AAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGC +AAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAG +AAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGAC +TTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAAC +TCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTG +TCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGA +TTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTAC +CACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAG +TACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCA +ATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAAT +ATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAA +AGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATAC +AAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGT +GGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCA +TAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCA +AAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAA +ATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAA +ACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTG +AATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGG +CATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTA +CTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGA +AATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAA +AAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAG +TAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCC +TGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAG +GGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATAC +ATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAG +GGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCA +TGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGA +CAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGT +ATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTAC +AGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCAC +TTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATA +ATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAAC +AGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGT +TTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCAC +TATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGA +TTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAG +GGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCA +GACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCC +ATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGC +TCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTA +CCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCAC +AGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGG +TTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATG +GGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTC +ATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAA +ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACT +CCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAA +AAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAA +GGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCT +CTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGG +ACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATT +GATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAA +TTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGC +TACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACAC +CACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGC +CACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGAC +AGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAA +TTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAA +TTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGA +AGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGA +ATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATAC +ATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCC +AATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAA +GTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAA +GCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAAT +TAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTAT +ACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGG +AAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCT +TAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATA +TGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCA +TACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTAC +TTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATG +CAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCC +CATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGG +TGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTG +GAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCAC +CAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTT +CCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGT +ACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTAT +TGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAG +AGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTC +TGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCT +GAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACAC +AGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGA +ATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCT +GTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTT +TGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGAC +CCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGA +AAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGA +CCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAAC +AAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCT +CCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGC +CATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGC +TCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGG +GGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGAC +GAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAG +CAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAG +AAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTT +TCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAA +TTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACT +TCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGT +GGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCT +TGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGA +AGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACA +AAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAG +GTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGC +GTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCT +AACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +>MK115491.1 +CTGATTTGCTGTGGCGGCCGCAAGGACTCAAGTAGGTAACTATAGAAACCCCCCACCAAT +TCTCTAGCAGTGGCGTCCGACGCTGGCCAAAACTCTCTAGCAGTGGCGCCCGAACAGACT +CTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAG +ATCCCAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCACCCTAAATC +TCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTG +GCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCACCTAAATCTCTAGCAGTGGCGCCC +GACTCTGGTAACTAGAGATCCCTCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTA +GAGACTCAGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACG +CCGAAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAA +TATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGA +AAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTA +ACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCAT +CCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATT +GTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAG +AGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAA +ACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCC +TATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAG +AAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCA +TGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATG +AGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCC +AGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAA +TAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAA +TCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAAC +AAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTG +AGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGA +ATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGA +TGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAA +TGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAA +AGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCC +CTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAG +AGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACT +TCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAG +AGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTT +CCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAA +AGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGG +AAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGA +TCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTAC +ACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCC +CATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGT +TAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAAT +GGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATT +TGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAA +TAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAA +AAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGA +TAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGG +GATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCA +AAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTA +TCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAA +AATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACA +TCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGT +ACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGT +GGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAA +ACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCT +AGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCC +ATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAAT +TTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCA +CACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGT +AATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATG +GTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCC +CTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTA +TGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAG +AGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGC +AATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATA +TACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGAT +AATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGG +AATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATT +TCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGC +AATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGA +TAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATG +GCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAG +TGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCT +CCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTT +CACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCAT +TCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAAT +TATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATT +CATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGT +AGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCA +AAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCT +TCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCC +AAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGT +GGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATG +TTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAA +TAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGG +GCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAA +AAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATT +ACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTC +CTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAA +AAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAG +AGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATG +GACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTG +GCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGA +GGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACA +TAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGAC +TAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTA +AAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATG +GCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATT +CTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAG +GATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATA +GGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAA +AAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGG +GGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACA +GTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGAT +GCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACA +GACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAA +AATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAG +CCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACT +AATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTC +AATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTT +GATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCA +GTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCC +CCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGT +AAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTA +CTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAAC +AATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCC +AACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGA +GCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAAT +ACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTT +AATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAA +TTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGG +AATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAAC +AGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGT +TCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAG +ACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATAT +AAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTG +CAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCA +GGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCT +GGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTG +CAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATAC +CTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACT +GCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATG +ACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATT +GAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGG +GCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATA +ATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAAT +AGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGA +CCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTT +CGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTC +CTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGA +CGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAG +CTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACA +GATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGA +ATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAG +TGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGG +GGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGC +AGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTT +TCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAG +CCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGA +TATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACAC +ACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGT +GGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCA +TGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATT +TCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTT +CTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGG +GAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCT +CTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAA +GCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTC +GCGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGACTCTGG +TA +>MK115527.1 +ACCTATTACAGCCCATAAAGAGGAGAAACGAACATAAAGCTAGTGCAAACCTGACTGCCC +GAGGCAGGGAGCTAGAGTTAGGTAACTAAAGCTCAATCACTAGCGCTCGAGCATGAGGGA +CTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAACATAAATCTCT +AGCAGTGGCGCCCTAACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAG +CAGTGGCGCCCGAACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCA +GTGGCGCCCGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGA +ACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAAC +ATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAACAT +GACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGCGCGACATGAGGCTCGGT +AACTAGAGATCCTCAGTAAATCCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAA +GCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGAC +TAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAAT +TAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAAC +ATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAA +CATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAG +AAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATAC +AGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGA +AAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACC +CCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAA +ATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTT +CAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGG +GACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGG +ATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGG +GAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATA +ATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAA +TAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCT +TTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGG +TAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTA +TTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAG +TGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAG +CTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCA +ATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTT +GGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTT +TAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAG +AGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTC +AGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTG +GCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATAC +AGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAAT +GATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAAT +CTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGG +AAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAAC +TGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGAC +AGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAAT +TTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGA +CAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTT +TTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAAC +AGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTA +TACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAA +TGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAAT +CTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTT +GTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACA +ACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATT +CCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCC +AGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGC +AAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAA +AGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAG +GGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGC +AGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAA +AAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACA +ATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCC +TAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCA +AGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTA +CCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAA +TAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTAT +CTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCA +GGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCA +AGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAA +AAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACA +AGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAA +GGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAA +TATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGG +AGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACA +TCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGA +AGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAG +ATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAA +GGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAG +TCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGA +TCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAG +AAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGA +CCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTA +CAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGG +GGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAAT +CATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGA +GGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAG +GATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACA +TCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAA +GAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACAC +AAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAG +AATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAG +CAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAA +AGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGC +ACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGA +GGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACA +ACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCT +GCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGT +GCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACC +CAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATT +GCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGAC +AGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG +TAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAA +TAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAA +AAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGA +GTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGG +ATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCT +GTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACA +GAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAA +GTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAG +ATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACC +CCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGT +GAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATA +AGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGAT +AATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGT +CCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATT +CTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTA +CAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTA +GCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATA +GTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAA +AGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATA +AGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTT +GAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGG +GACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACA +ACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGAT +GGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGA +AAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGG +TTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGA +GGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAG +CCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCA +GTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCA +GCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAA +AACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGC +ATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGC +CTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCT +AGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAA +AGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAG +CAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGG +TTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTG +ATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATAT +TCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGA +ATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTC +TTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGA +GACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATC +CTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATT +AGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTA +GTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAA +AGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGC +TGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCG +AGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTG +CGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGT +GCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAA +GGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGT +CTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAG +ATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAA +TCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGA +AAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGA +GAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCG +CTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGA +TGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTG +AGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCC +T +>MK115518.1 +TCCATTGCCCAGTTGTATCAGCTCAAGCTAGTTTCGCACAGAACCCTCTTACAAGAGCTG +CCGCCGAGACCGATACTAGTAGCGAGCGATCCTAAATCTCTAGCAGTGGCGCCCGAACAG +ACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCT +AGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGG +CGCCCGACTCTGGTAACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAAC +TAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACCTCCTAAATCTCTAGCAGTGG +CGCCCGAACAAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTC +CTAAATCTCTAGCAGTGGCGCCCGACGACTCTGGTAACTAGAGATCCCTCCTAAATCTCT +AGCAGTGGCGCCCGAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGC +CCGACTCTGGTAACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGAACAACTCTGGACT +CTGAAAGCGAAAGTAAAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCG +CGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTTGACTAGC +GGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGA +TGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTT +AGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATC +AGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGA +ACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGT +ACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAA +GGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCAT +AGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGC +ATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGC +ATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACA +TCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAG +ATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAG +TGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCC +ACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGT +AAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAG +AGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAA +AAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTT +AAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGG +GGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAA +TGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTG +TGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAA +ATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGG +GAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCC +AACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAA +GCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAG +CGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGA +GCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATA +GGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGT +GGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGA +AATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTA +CCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAA +GAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCA +AAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGT +ACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGG +GAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTA +CTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACT +GCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTG +CTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTA +GAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTAT +GTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACAT +CTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTT +TGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAA +AAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGT +CAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCA +CTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAA +ATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAA +GTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAAT +CTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTA +ACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAA +TTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCC +ACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAA +TTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGA +GAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCC +CTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGAT +TCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCA +CAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAG +GAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTA +GACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCC +CAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATA +CCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAG +GCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTA +GAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTT +ATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGG +CCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCC +GCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAA +GGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAG +GCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAA +GGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTA +CAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGG +GACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCA +GTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATT +AGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGAT +TAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATG +GTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCC +ACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGA +ATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGT +TGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATC +TGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGG +ACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAG +AAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCA +GAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAA +CTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACAT +ATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAA +CAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCA +CAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGG +AAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCA +AGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCG +ACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGT +ATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAAT +AGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAG +GATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGA +AGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGT +TGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTAT +GGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGG +CACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAG +GATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGC +ATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCAC +TCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGG +AGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAA +ATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATG +ATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAA +AGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAA +AGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAAT +GTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAG +AAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTAC +ATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTA +TCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGAC +AAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAA +AATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACC +CAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACAC +AGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAA +ACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAG +CAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTAC +TATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAG +ATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCAT +TAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGG +GAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGT +CAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACA +ATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCA +AGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGG +GAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTT +GGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAG +AAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGG +AAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTA +ACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAG +GTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCAC +CATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCG +AAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGG +CACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACT +TACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCA +AACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCT +TATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTAC +AAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGG +CATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTA +AGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGAC +CTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCC +TGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCT +TTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGG +GGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTAC +AACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATAT +CCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAA +GGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAA +GAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAG +CATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGG +GGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCT +GCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCC +TGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +>MK115530.1 +TAACTAGCAGTCCCCCGCGGCGGCCCGGCAATGGCTGGACCCGACCCCCCAACCCCTGCC +GCCGGCGCCGACTATCGAGACTGGTAACCCCCCACCCCCCAACCCTAGCCGCGCGGCCCG +ACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGACAGACTCTG +GTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGC +AGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCATCCCAAATCTCTAGCAGTGG +CGCCCGAACAGACTCTGGTAACTAGAGATCCCCAGCTCTAGCAGTGGCGCCCGCGACTCT +GGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAG +CAGTGGCGCCCGACTGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGG +CCCCGAGCTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACA +GACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTC +TGGTAACTAGAGATCCCTACTCCAATCTCAGCAGCTCTCTCGGCGCAGGACTCGGCTTGC +TGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTT +GACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAA +AATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAA +AACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAG +AAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGAT +CAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGA +TACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTA +AGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATT +ACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTT +TAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGT +TTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGG +GGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAAT +GGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAA +GGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAA +ATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATA +AAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAAC +CCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGG +AGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGA +CTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAG +GAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATT +CAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTT +TCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCT +GTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATT +TTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGAC +CAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCT +CTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCT +TTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGA +TACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAA +AATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGA +AATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAAT +TGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGA +AACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATT +GACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAA +AATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAA +AGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGA +CTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGT +AACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAA +GTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTA +CAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAA +AATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGA +TTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAG +ACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCC +ATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACT +GCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTG +GGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAAC +CAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAA +CAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAAT +AGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATT +TAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAA +ACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAAC +TCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTG +GCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATG +GTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGC +TAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGT +TATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTT +GCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCAT +TCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAAT +AAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGA +ACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGA +TAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTT +TAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAA +AGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTAC +ACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGC +AGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGG +GAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGT +TAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCA +AAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAG +AGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAA +AAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAAC +AGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTA +TTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGA +AGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAA +AATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGA +TGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTA +AAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTAC +ACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAG +AAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCA +CACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTT +CAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATC +AAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACAC +CAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACG +AGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTT +AGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGG +ACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAAC +CCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCAT +TGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGC +ACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTC +ATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGA +GACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT +AAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAG +CAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGAC +AAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATG +AGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTG +GGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTA +CCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACC +ACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAA +GAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAA +CAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTA +ACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGT +AGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAA +ATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATA +GATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCC +TGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCG +ATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACA +GTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGT +TTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATA +ATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATG +AAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGAT +ATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTA +GTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGA +GGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAAT +ACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTA +GATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTA +GGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACA +GGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGA +GGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATT +GAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGA +GCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGC +GCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAG +CAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGG +GGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAG +CGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAAT +GCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGG +GAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAAC +CAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAAT +TGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGA +TTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGA +TATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAA +GGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGA +TTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTG +AGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAA +ATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCT +ATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAA +GTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTG +GAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCC +TGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATC +TCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGA +TTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCA +GGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGA +AAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTG +GGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGAC +CAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGC +CAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCC +GGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCG +AGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTT +TCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTC +AGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGAT +CTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTT +GCCT +>MK115503.1 +GCTCTCGAACAGTGCGGACTCTGGTAACTAGAGATCCCTCAGCTCTAGCAGTGGCGCCCG +AACAGAATCTCTAGCAGTGGCGCCCGACGACTCTGGTAACTAGAGATCCTAAATCTCTAG +CAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTACTCTAGCAGTGGCGCCCAGA +ACATGGACTCTGGTAACTAGAGACCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGT +AACTAGAGATCCCTCCCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAG +ATCCCTCCTAACTCTAGCAGTGCGCCCGACTCTGGTAACTAGAGATCCTAAATCTCTAGC +AGTGGCGCCCGACAGACTCTGGTAACTAGAGATCCCTCACCTAAATCTCTAGCAGTGGCG +CCCGAGAACAGATCTGGTAACTAGAGCCCTACTAAATCTCTAGCAGTGGCGCCCGAACAG +ACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGGACTCTGGTAACT +AGAGATCCTCCTAAATCTCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATC +CCTCAGCTCTAGCAGTGGCGCCCGAACAGAATCTCTAGCAGTGGCGCCCGGGACTCTGGT +AACTAGAGATCCTCACTAAATCTAGCAGTGGCGCCGAGAGGAGACTCTCTCGGCGCAGGA +CTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGA +AAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATT +AAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAA +ATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCC +TGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCT +TCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGT +ACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCA +AAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAG +CAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATC +ACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGT +CATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCT +AAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGA +AGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGAT +GAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGC +ATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTT +GGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGG +ACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCA +AGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCC +AGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGAC +AGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAG +CCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGAT +TGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAG +GAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAG +ACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCT +TCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGAC +AATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCT +CAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAA +GCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAA +TGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAG +ATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCT +GTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATT +AGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAA +CAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAA +AAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCT +ATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAG +AGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAG +AAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAA +GAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATT +AGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGT +AGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAA +TACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATA +GAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAG +AAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAG +CCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGA +AAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTC +CTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAA +CTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCA +AAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTAT +CAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACT +AATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATA +TGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGG +GCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTA +GTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTA +GATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGA +AGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATT +TATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACA +TTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATA +GAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATT +GGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTA +GATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATG +GCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAA +TGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAA +CTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGA +TATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTG +AAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACC +AGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCC +TACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATA +GGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATC +CACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGAT +ATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAAT +TTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTC +TGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGG +AGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCA +AGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTC +AAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAG +TTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCT +GAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAG +GAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTT +TGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAG +GTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGC +ATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGA +TAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACA +TTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTC +CATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCC +ATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGC +AGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGA +GCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAA +GTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAG +GAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCT +ATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATT +AGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAA +AATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGA +CAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCA +CCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCT +ATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTA +AAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACC +CCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATA +ACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCAT +GTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATA +CCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATA +TCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATG +TAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCA +TTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGG +CTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAA +ATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGT +TAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATG +CTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACA +ACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCA +TAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTT +TAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATC +ACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTT +TCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATG +CTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGT +GGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCAT +CAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCT +TCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAG +TAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAA +GAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAA +GCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTA +TAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAAC +TCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAC +AGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTG +TGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCT +GGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAA +AGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAA +GTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGA +TAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAG +TTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCG +ACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGAT +TAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCT +GCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCA +GGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAA +AGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATA +GGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAA +GACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGG +GGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTG +GGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCT +ACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCA +GTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCAC +TTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATC +CTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCA +GGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAG +CCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGG +ATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCAT +CACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTAC +AAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGT +GGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGG +TTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCT +CAATAAAGCTTGCCTTG +>MK115509.1 +CCCCAAATCTCTAGCCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCCCAAATCTCT +AGCAGTGGCGCCCGAACAGAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCC +TAAATCTCTAGCAGTGGCGCCCGAAGACTCTGGTAACTAGAGATCCCTCACCCTAAATCT +CTAGCAGTGGCGCCCGCTCGTACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGAACAG +ACTCTGGTAACTAGAGATCCCTCACCCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTG +GTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAAC +TAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTACTAGAGA +TCCCTCAAATCAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCAC +AGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAGCGGAG +GCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCA +TGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTA +TGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAG +GGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTT +AAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAA +GACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCA +CAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTG +CAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGG +GTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTA +TCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAA +GCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTG +CATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGAC +ATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCT +ATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGG +ATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGAC +TATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAAT +TGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAA +GCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGA +CCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTA +ATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGC +AAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGT +GGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAA +ATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACA +GCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAG +GAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGAC +CCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAG +ATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGG +GAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGAC +ACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATC +TGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAG +TAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAA +AAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAA +TTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTA +AATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAG +TTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGG +ATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCAT +TTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGC +CACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGC +CTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAG +GATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGT +TAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGA +TGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAG +ACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGA +TTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAA +CAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTT +TAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTAC +AGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGA +AAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAG +AGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTA +GACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCT +GGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAG +AGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAA +CTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAA +CGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGG +GATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAAC +CAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAA +AAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACA +AACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAG +AAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCC +CTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCA +TGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAG +GGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTC +CAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAG +TAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCT +GTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAG +TAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTG +AACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGG +GGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAA +CTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACA +GCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAG +TAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGG +ATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGA +ACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTT +TATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTA +GGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGG +CATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGAC +CCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCT +ATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACAT +AACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGA +AAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAG +ACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTA +AGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCT +ATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAAC +TGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGA +GGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGT +CAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTT +TGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGA +AGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATAT +GTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCA +ATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATA +GACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGG +GATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGAT +GATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAA +AGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACA +TAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATT +GGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGA +GGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTG +TGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGG +AAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAA +GATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAA +TACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGT +ATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTG +TAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTAC +ACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGA +AGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCT +GAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCC +TCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGC +ACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATT +AAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGA +AATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCT +GTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACAT +CACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAAT +GTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATT +AGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATAT +GAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGG +AGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAAT +AGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGT +GACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTT +GCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCA +GCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAAT +TTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAG +TAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAAT +TAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAA +AAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACAT +AACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTT +AAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATT +ATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGA +AGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACT +TTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACT +CTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACA +TTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATT +CAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAG +AGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATT +GTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGG +AAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGG +AAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGC +TGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAA +GACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGAC +TGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACA +CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCAC +TGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAG +AGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAG +TATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATC +CGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGGGGAC +TTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCAT +ATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGG +AGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +>MK115490.1 +CGCTAGTTTAGAGATACTCTTATAACTACAGAACACGCCAACCAAATCGCTAAGAGGGGG +GGCCCGACTGTGGTTACTAAAGATCCATCCAAAATCTCTAGCAGTGGCGCCCGAACAGAC +TCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGC +AGTGGCGCCCAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGA +ACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTC +TGGTAACTAGAGATCCCTCAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGCAGTG +GCGCCCGAACAAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGCAGTGGCGCCCGA +ACAAATCTCAGCAGGGGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAA +GAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTTGACTAGCGGAGGCTAGA +AGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAA +AAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCA +AGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGT +AGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCA +TTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACC +AAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAA +GTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAAC +CTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAA +GTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAA +GGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCT +ATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCA +GTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCA +GGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCA +GTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTAT +AGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTA +GACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATG +ACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTA +GGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGC +CATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATG +CAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAA +GGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAG +GAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGG +CCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCA +CCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCA +AGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCG +TCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATA +CAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTG +GAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAG +CTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGA +CTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAAT +TAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAA +AAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGC +CTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGA +GAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAAT +TAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGG +GTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCA +TACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGG +GATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTA +GAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTG +ACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGT +GGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTT +ATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCT +GGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACG +CAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGG +TAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAG +AACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGC +AGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAG +GAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAG +TACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTAC +CTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTC +CTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAG +AACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAAT +TAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACA +CAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAG +AAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATA +AGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCT +ACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAG +TCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACC +ATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAG +TAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATG +GACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAG +TTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAG +AGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAA +CAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGT +GGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAG +AATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATC +TTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTG +GGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAG +AATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAG +ATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATAC +AAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATG +GCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGG +AACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGA +CATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGAT +GCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTG +GGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGAC +CTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGA +AATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAG +GTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCA +CCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAG +GGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATG +AAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAA +CTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGT +TTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAG +CAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCT +AAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTC +ATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCT +CCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATG +CAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTT +GTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGG +TTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAG +GAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTG +TAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGC +AAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGT +TTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAA +TGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGT +AATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAC +TTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGAT +GGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCA +GAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAG +TTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTT +TGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGA +TAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGG +AATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGT +AGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGA +ACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGG +ACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTG +TAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGA +ACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTAT +AATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAA +TAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACT +CCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGC +CCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAG +AGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGA +CAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGC +ACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGC +TGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCT +GACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAG +AGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCA +GGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGG +TTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAA +ATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAA +TTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGA +ACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAA +ATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAAT +AGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTT +TCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGG +TGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTG +GGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGAT +TGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTG +GAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGT +CACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTG +TAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATA +AAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAA +TGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGAC +ATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAG +CACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAA +TGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAG +GGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAG +GCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCT +TTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACA +ACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAA +TGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGT +ACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTTCGCTGGGGACTTTCCA +GGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGC +AGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCT +CTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT +>MK115576.1 +AACAGACTCTGGTAAGTAGTGGTCCGCTCAAAATCTCTAGCAGTGGCGCCCGACTCTGGT +AACTAGAGATCCCTCAAAATCTCTAGCAGTGGCGCCCGATCAAAATCTCTAGCAGTGGCG +CCCGAGACTCTGGAACTAGAGATCCAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAG +AGATCCCTCAGTGAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCC +CTCAAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCAAATCTCTA +GCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCAGTGAAATCTCTAGCAGGAGCTCT +CTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGG +TGAGTACGCCGAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGA +GCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGG +GGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTT +GCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTA +CAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTC +CTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTA +GAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGAC +ACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACAT +CAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTC +AGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTA +AACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACC +ATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCA +CCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAG +GAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGA +TGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGAT +ATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTA +AGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAA +AATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAG +GAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCT +GAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAAC +CAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGC +AGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGAC +TGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCA +GGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTT +GGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCC +TTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGC +AATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTT +TGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGAC +AGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAG +GACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAA +ATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCC +CAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTA +CAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTC +CAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAG +AACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAG +GGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTC +CCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGA +CACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAA +TATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAG +TTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATA +GAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACA +AAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGT +GGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGA +AGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAAT +TATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAG +CAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATT +ATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACAT +ATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGG +GTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAA +GCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGG +AGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATA +CCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAA +CTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCA +CTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGT +TACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACT +CACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCA +ATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCAC +ACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAG +TACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATT +GGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCA +GCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAG +GAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATG +TAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCAT +ACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCA +GCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAAT +TTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAA +AGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGG +CAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAA +GAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAA +AAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAG +CAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAG +TAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATG +ATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCAT +ATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCAT +CCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACA +TATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAA +TGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCAT +CTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATA +GTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTG +GCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAA +CTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACA +ATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTA +GGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAG +GAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGT +GTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGAT +CCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGC +TATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATC +TCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGAT +CAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCA +ATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATA +GAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAA +AGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATG +GAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTG +GGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGC +ATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGT +ACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACAT +GTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAG +CCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAA +TGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTG +CTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTA +TAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAA +CACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTA +TTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGG +ACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAAC +TCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTT +CACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTAC +AAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGC +AACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATG +GAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAAT +AATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGG +AGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTG +GACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGAT +TATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAAT +TAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGA +GACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATA +TAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAG +AGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGG +AGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTT +ATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACA +TCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGA +AAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTG +CACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGA +TAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACAC +CTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGA +TAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATT +ATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTAT +AGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCC +GAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAG +ATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTG +CCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACT +TCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGAT +TCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGA +GGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACC +TACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAA +AAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAG +CAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCA +ATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAG +TGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCG +ATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAA +GACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGA +ACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAG +TACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGA +GCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCC +TAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATT +GAGCTTTCTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGG +GACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGG +GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCAC +TGCTTAAGCCTCAATAAAGCTTGCCT diff --git a/tests/expected-results-large/nonintact.fasta b/tests/expected-results-large/nonintact.fasta index 9113fa3..29434e4 100644 --- a/tests/expected-results-large/nonintact.fasta +++ b/tests/expected-results-large/nonintact.fasta @@ -264,169 +264,6 @@ ACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGAT TAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAG ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGG TCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTC ->MN692145 -TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA -CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC -TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA -GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT -GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT -ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG -AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT -GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC -TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG -TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG -TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG -AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC -GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG -TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG -GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA -ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG -ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT -AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA -TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC -AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT -GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA -GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA -AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA -AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC -TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC -CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA -TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT -TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA -AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT -GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC -ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT -CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA -TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC -CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA -AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA -GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG -CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA -ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA -AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA -GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT -ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG -ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT -GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA -GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA -ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT -CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA -GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA -CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA -TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT -ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA -GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA -AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA -ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT -ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC -CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC -AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC -AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA -CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA -CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA -GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT -GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA -ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA -AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG -GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA -GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA -GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT -CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC -ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA -TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA -TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT -GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA -TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA -GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA -GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG -GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA -CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT -ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG -ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG -AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA -GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC -AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA -AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT -TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT -AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG -ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT -AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA -TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT -GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG -AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA -CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT -ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC -TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC -TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG -AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT -AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG -GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT -TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT -GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC -TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA -AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA -CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT -ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC -TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA -TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT -ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG -CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA -CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG -CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA -CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA -GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA -ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG -GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG -AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA -ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA -AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA -AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT -GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG -AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC -AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG -TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG -CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT -TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG -AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC -TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG -GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA -AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT -TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC -CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA -GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA -AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA -TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC -AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG -TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC -AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT -GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG -AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC -AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT -GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG -GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC -AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC -CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC -GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT -GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA -GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA -TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG -GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA -TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA -GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT -GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT -CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA -GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA -TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG -GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC -AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA -GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG -CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG -GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG -CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG -GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT -GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC -CTTTTAGTCAGTGTGGAAAATCTCTAGCA >MN090335 GGACCTGAAAGCGAAAGTAGAACCAGAGAAGATCTCTCGACGCAGGGCTCCTTCTGATAA TGCTGAAAACATGGGTATTACTTCTGGGCTGAAAGCCTTTTCTTCTACTACTTTTACCCA @@ -731,166 +568,6 @@ CCGCTAGGGACTTTCCAGGGGAGGCGTGAACTGGGCGGGACAGGGGAGTGGCGAGCCCTC AGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGGTCTCTCTGGTTAGACCAGAT CAGAGCCTGGGAGCTCTCTGGCTAGCTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTT GCCTTGAGTGCTTAAAGTAGTGTGTGCCCGTCTGTTGTGTGACTC ->MK115581.1 -AAATTGGGACGTTCGCCTACGCAAGCGAAAATTTCTCTACGTAGCCACCTTTCCCGATTA -ACGTCAGAACCCTAAAATTAAAATAAATCCTAGCGGCCGACCGACTCTGGTAACTAGAGA -TCCCTCAAAGATAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCC -TCAGATTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACA -GACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCGAATCATCTT -AGAGTGGCGCCCGAACGACTCTGGTAACTAGAGATCCCTCAAAGATAAATCTCTAGCAGT -GGCGCCCGCGACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCG -AGACTCTGGTAACTAGAGATCCCTCAGATTAAATCTCTAGCAGTGGCGCCCGAACAGACT -CTGGTAACTAGAGATCCCTCAAAGATAAATCTCTAGCAGTGGCGCCCGACACAGGTACTA -GAGAAAGCGAAAGTAAAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCG -CGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAG -CGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAG -ATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATT -TAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACAT -CAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAG -AACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGG -TACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAA -AGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCA -TAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATG -CATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAG -CATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGAC -ATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATA -GATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAA -GTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATC -CACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAG -TAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTA -GAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAA -AAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTT -TAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGG -GGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTA -ATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATT -GTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGA -AATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAG -GGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGC -CAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGA -AGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCA -GCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGG -AGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGAT -AGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTG -TGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAG -AAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGT -ACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGA -AGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTC -AAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAG -TACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTG -GGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGT -ACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATAC -TGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGT -GCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTT -AGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTA -TGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACA -TCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCT -TTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGA -AAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAG -TCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGC -ACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGA -AATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGA -AGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAA -TCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATT -AACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAA -ATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGC -CACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCA -ATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAG -AGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTC -CCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGA -TTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGC -ACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAA -GGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGT -AGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGC -CCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATAT -ACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGA -GGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCT -AGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGT -TATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATG -GCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGC -CGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCA -AGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCA -GGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAA -AGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCT -ACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAG -GGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGC -AGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCAT -TAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGA -TTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGAT -GGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCC -CACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAG -AATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAG -TTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAAT -CTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAG -GACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGA -GAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACC -AGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGA -ACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACA -TATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCA -ACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCC -ACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAG -GAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCC -AAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGC -GACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAG -TATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAA -TAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAA -GGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTG -AAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATG -TTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTA -TGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAG -GCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTA -GGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATG -CATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCA -CTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAG -GAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGA -AATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAAT -GATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCA -AAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTA -AAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAA -TGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCA -GAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTA -CATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGT -ATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGA -CAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAA -AAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGAC -CCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACA -CAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGA -AACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAA -GCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTA -CTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGA -GATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCA -TTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTG -GGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCG -TCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAAC -AATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATC -AAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTG -GGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGT -TGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGA -GAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAG -GAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTT -AACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATA -GGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCA -CCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATC -GAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTG -GCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGAC -TTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTC -AAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGC -TTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTA -CAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGG -GCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGT -AAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGA -CCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGC -CTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCC -TTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGG -GGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTA -CAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATA -TCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCA -AGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAA -AGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAA -GCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTG -GGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGC -TGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGC -CTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTG -CACTCAAGGCAAGCT >MK115690.1 TGGAAGGGATAATTTACTCCCAAAAAAGACAAGATATTCTTGATCTGTGGGTCTACAACA CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACTAGATTTCCAC @@ -1686,165 +1363,6 @@ CCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTAGAC CAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAA AGCTTGCCTTGCACTCAAGGCAAGCTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAAC TAGAGA ->MK115498.1 -AACACGGAATGGGAGATAAGCAGCATCTCTATCGGCGCGGCGAGATCTGACACTGGTAAC -TAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATC -CCTCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCCTAAATCTC -TAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTG -GCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCC -TCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGCAGTGGCGCCCGAACAGAC -TCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAA -CTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGGACTCTGGTAACTAGAGATCCCT -CACCCTAGATCTCTAGCAGTGGCGCCCGCGAAGGCACTAGGACCTGAAAGCGAAAGTAAA -ACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGA -GGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGA -GAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATT -CGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGG -GAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAA -ATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTT -AATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAA -GCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCA -GCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAG -GGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTA -GAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCC -ACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAA -ATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCAT -GCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACT -ACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGA -GAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCT -ACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGG -TTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAA -ACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCA -GCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAA -GCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGA -GGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCAC -ATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGA -CATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCC -CACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAA -GAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGAC -AAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAA -TAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTAT -TAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTT -TTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAG -GTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGC -TTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGC -CAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCAT -TAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAA -ATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAAT -TAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAA -TACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATG -CATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTA -GTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGA -AAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGC -AAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAG -AAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGAC -TTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAAC -TCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTG -TCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGA -TTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTAC -CACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAG -TACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCA -ATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAAT -ATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAA -AGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATAC -AAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGT -GGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCA -TAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCA -AAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAA -ATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAA -ACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTG -AATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGG -CATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTA -CTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGA -AATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAA -AAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAG -TAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCC -TGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAG -GGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATAC -ATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAG -GGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCA -TGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGA -CAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGT -ATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTAC -AGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCAC -TTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATA -ATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAAC -AGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGT -TTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCAC -TATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGA -TTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAG -GGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCA -GACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCC -ATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGC -TCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTA -CCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCAC -AGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGG -TTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATG -GGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTC -ATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAA -ATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACT -CCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAA -AAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAA -GGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCT -CTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGG -ACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATT -GATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAA -TTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGC -TACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACAC -CACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACATAATGTTTGGGC -CACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGAC -AGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAA -TTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAA -TTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGA -AGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGA -ATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATAC -ATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCC -AATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAA -GTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAA -GCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAAT -TAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTAT -ACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGG -AAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCT -TAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATA -TGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCA -TACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTAC -TTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATG -CAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCC -CATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGG -TGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTG -GAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCAC -CAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTT -CCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGT -ACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTAT -TGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAG -AGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTC -TGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCT -GAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACAC -AGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGA -ATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCT -GTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTT -TGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGAC -CCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGA -AAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGA -CCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAAC -AAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCT -CCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGC -CATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGC -TCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGG -GGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGAC -GAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAG -CAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAG -AAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTT -TCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAA -TTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACT -TCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGT -GGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCT -TGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGA -AGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACA -AAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAG -GTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGC -GTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCT -AACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT >MK115211.1 CTTCTAGCCTCCGCTAGTCAAAACGCCGCCCCTCGCCTCTTGCCGTGCGCGCTTCAGCAA GCCGAGTCCTGCGTCGAGAGAGCTCCTCTGGTTTCTCTTTCGCTTTCAAGTCCCTGTTCG @@ -2777,165 +2295,6 @@ CATAGAGTTTTCCACCAGGGACTTTCCAGAAGAGGCGTGGCCTGGGCGGGACCGGGGAGT GGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTGCCTGTACTGGGTCTCTCTGGT TAGACCAGATCTGAGCCTGGGAGCTCTCTGTCTAACTAGGGAACCCACTGCTTAAGCCTC AATAAAGCTTGCCTTG ->MK115491.1 -CTGATTTGCTGTGGCGGCCGCAAGGACTCAAGTAGGTAACTATAGAAACCCCCCACCAAT -TCTCTAGCAGTGGCGTCCGACGCTGGCCAAAACTCTCTAGCAGTGGCGCCCGAACAGACT -CTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAG -ATCCCAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCACCCTAAATC -TCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTG -GCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCACCTAAATCTCTAGCAGTGGCGCCC -GACTCTGGTAACTAGAGATCCCTCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTA -GAGACTCAGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACG -CCGAAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAA -TATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGA -AAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTA -ACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCAT -CCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATT -GTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAG -AGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAA -ACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCC -TATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAG -AAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCA -TGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATG -AGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCC -AGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAA -TAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAA -TCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAAC -AAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTG -AGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGA -ATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGA -TGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAA -TGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAA -AGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCC -CTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAG -AGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACT -TCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAG -AGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTT -CCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAA -AGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGG -AAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGA -TCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTAC -ACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCC -CATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGT -TAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAAT -GGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATT -TGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAA -TAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAA -AAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGA -TAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGG -GATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCA -AAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTA -TCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAA -AATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACA -TCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGT -ACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGT -GGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAA -ACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCT -AGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCC -ATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAAT -TTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCA -CACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGT -AATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATG -GTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCC -CTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTA -TGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAG -AGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGC -AATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATA -TACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGAT -AATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGG -AATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATT -TCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGC -AATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGA -TAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATG -GCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAG -TGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCT -CCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTT -CACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCAT -TCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAAT -TATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATT -CATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGT -AGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCA -AAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCT -TCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCC -AAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGT -GGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATG -TTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAA -TAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGG -GCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAA -AAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATT -ACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTC -CTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAA -AAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAG -AGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATG -GACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTG -GCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGA -GGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACA -TAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGAC -TAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTA -AAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATG -GCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATT -CTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAG -GATTAGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATA -GGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAA -AAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGG -GGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACA -GTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGAT -GCTAAAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACA -GACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAA -AATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAG -CCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACT -AATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTC -AATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTT -GATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCA -GTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCC -CCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGT -AAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTA -CTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAAC -AATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCC -AACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGA -GCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAAT -ACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTT -AATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAA -TTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGG -AATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAAC -AGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGT -TCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAG -ACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATAT -AAAGTAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTG -CAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCA -GGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCT -GGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTG -CAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATAC -CTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACT -GCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATG -ACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATT -GAAAAGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGG -GCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATA -ATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAAT -AGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGA -CCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTT -CGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTC -CTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGA -CGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAG -CTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACA -GATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGA -ATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAG -TGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGG -GGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGC -AGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTT -TCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAG -CCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGA -TATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACAC -ACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGT -GGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCA -TGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATT -TCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTT -CTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGG -GAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCT -CTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAA -GCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTAGTGTGTGCCCGTCTGTTGTGTGACTC -GCGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGACTCTGG -TA >MK116110.1 CCTGAAAGCGAAAGTAGAACCAGAGAAGTTCTCTCGACGCAGGACTCGGCTTGCTGAGCT TTATGGCCGGGTCCCCCCACTCCCTGACATGCTGTCATCATTTCTTCTAGTGTAGCTGCT @@ -3087,166 +2446,6 @@ CTGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCCGCTTTCGCCTGTACTGGGTC TCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAGCTGGGGAACCCACTGCT TAAGCCTCAATAAAGCTTGCCTTGAGTGCTTAAAGTAGTGTGTGCCCGTCTGTTGTGTGA CTCTGGTAGTTACCAGAGTCACACAAC ->MK115527.1 -ACCTATTACAGCCCATAAAGAGGAGAAACGAACATAAAGCTAGTGCAAACCTGACTGCCC -GAGGCAGGGAGCTAGAGTTAGGTAACTAAAGCTCAATCACTAGCGCTCGAGCATGAGGGA -CTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAACATAAATCTCT -AGCAGTGGCGCCCTAACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAG -CAGTGGCGCCCGAACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCA -GTGGCGCCCGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGA -ACATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAAC -ATGAGGGACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGGCGCCCGAACAT -GACTCTGGTAACTAGAGATCCCTCATTAAATCTCTAGCAGTGCGCGACATGAGGCTCGGT -AACTAGAGATCCTCAGTAAATCCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAA -GCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGAC -TAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAAT -TAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAAC -ATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAA -CATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAG -AAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATAC -AGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGA -AAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACC -CCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAA -ATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTT -CAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGG -GACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGG -ATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGG -GAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATA -ATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAA -TAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCT -TTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGG -TAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTA -TTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAG -TGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAG -CTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCA -ATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTT -GGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTT -TAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAG -AGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTC -AGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTG -GCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATAC -AGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAAT -GATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAAT -CTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGG -AAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAAC -TGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGAC -AGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAAT -TTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGA -CAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTT -TTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAAC -AGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTA -TACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAA -TGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAAT -CTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTT -GTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACA -ACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATT -CCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCC -AGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGC -AAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAA -AGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAG -GGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGC -AGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAA -AAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACA -ATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCC -TAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCA -AGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTA -CCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAA -TAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTAT -CTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCA -GGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCA -AGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAA -AAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACA -AGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAA -GGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAA -TATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGG -AGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACA -TCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGA -AGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAG -ATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAA -GGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAG -TCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGA -TCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAG -AAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGA -CCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTA -CAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGG -GGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAAT -CATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGA -GGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAG -GATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACA -TCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAA -GAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACAC -AAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAG -AATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAG -CAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAA -AGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGC -ACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGA -GGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACA -ACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCT -GCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGT -GCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACC -CAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATT -GCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGAC -AGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAG -TAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAA -TAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAA -AAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGA -GTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGG -ATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCT -GTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACA -GAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAA -GTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAG -ATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACC -CCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGT -GAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATA -AGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGAT -AATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGT -CCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATT -CTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTA -CAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTA -GCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATA -GTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAA -AGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATA -AGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTT -GAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGG -GACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACA -ACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGAT -GGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGA -AAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGG -TTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGA -GGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAG -CCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCA -GTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCA -GCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAA -AACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGC -ATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGC -CTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCT -AGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAA -AGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAG -CAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGG -TTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTG -ATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATAT -TCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGA -ATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTC -TTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGA -GACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATC -CTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATT -AGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTA -GTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAA -AGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGC -TGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCG -AGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTG -CGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGT -GCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAA -GGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGT -CTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAG -ATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAA -TCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGA -AAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGA -GAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCG -CTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGA -TGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTG -AGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCC -T >MK114997.1 TGCGTCGAGAGAGCTCCTCTGGTTTCTCTTTCGCTTTCAAGTCCCTGTTCGGGCGCCACT GCTAAGATTAGGGACCTGAAAGCGAAAGAGAAACCAGAGGAGCTCTCTCGACGCAGGACT @@ -3399,166 +2598,6 @@ CTGCATCCGGAATATTTCAAGGACTGCTGACACTGAGATTTCTACAAGGGACTTTCCGCT GGGGACTTTCCAGGGGAGGCGTGGCCTGGGCGGGACAGGGGAGTGGCGAGCCCTCAGATG CTGCATATAAGCAGCTGCTTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAG CCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTT ->MK115518.1 -TCCATTGCCCAGTTGTATCAGCTCAAGCTAGTTTCGCACAGAACCCTCTTACAAGAGCTG -CCGCCGAGACCGATACTAGTAGCGAGCGATCCTAAATCTCTAGCAGTGGCGCCCGAACAG -ACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCT -AGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGG -CGCCCGACTCTGGTAACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGACTCTGGTAAC -TAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACCTCCTAAATCTCTAGCAGTGG -CGCCCGAACAAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTC -CTAAATCTCTAGCAGTGGCGCCCGACGACTCTGGTAACTAGAGATCCCTCCTAAATCTCT -AGCAGTGGCGCCCGAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGC -CCGACTCTGGTAACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGAACAACTCTGGACT -CTGAAAGCGAAAGTAAAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCG -CGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTTGACTAGC -GGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGA -TGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTT -AGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATC -AGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGA -ACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGT -ACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAA -GGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCAT -AGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGC -ATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGC -ATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACA -TCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAG -ATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAG -TGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCC -ACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGT -AAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAG -AGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAA -AAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTT -AAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGG -GGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAA -TGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTG -TGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAA -ATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGG -GAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCC -AACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAA -GCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAG -CGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGA -GCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATA -GGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGT -GGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGA -AATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTA -CCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAA -GAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCA -AAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGT -ACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGG -GAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTA -CTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACT -GCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTG -CTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTA -GAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTAT -GTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACAT -CTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTT -TGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAA -AAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGT -CAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCA -CTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAA -ATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAA -GTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAAT -CTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTA -ACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAA -TTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCC -ACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAA -TTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGA -GAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCC -CTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGAT -TCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCA -CAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAG -GAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTA -GACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCC -CAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATA -CCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAG -GCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTA -GAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTT -ATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGG -CCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCC -GCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAA -GGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAG -GCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAA -GGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTA -CAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGG -GACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCA -GTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATT -AGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGAT -TAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATG -GTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCC -ACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGA -ATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGT -TGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATC -TGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGG -ACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAG -AAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCA -GAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAA -CTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACAT -ATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAA -CAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCA -CAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGG -AAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCA -AGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCG -ACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGT -ATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAATAGTAGCAGCAATAAT -AGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAG -GATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGA -AGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGT -TGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTAT -GGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCCCAGAGG -CACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAG -GATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGC -ATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCAC -TCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGG -AGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAA -ATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATG -ATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAA -AGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAA -AGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAAT -GTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAG -AAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTAC -ATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTA -TCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGAC -AAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAA -AATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACC -CAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACAC -AGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAA -ACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAG -CAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTAC -TATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAG -ATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCAT -TAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGG -GAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGT -CAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACA -ATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCA -AGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGG -GAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTT -GGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAG -AAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGG -AAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTA -ACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAG -GTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCAC -CATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCG -AAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGG -CACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACT -TACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCA -AACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCT -TATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTAC -AAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGG -CATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTA -AGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGAC -CTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCC -TGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCT -TTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGG -GGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTAC -AACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATAT -CCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAA -GGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGATGGAGGACCCGGAAAAA -GAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAG -CATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGG -GGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCT -GCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCC -TGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT >MK115065.1 TAGCCTCCGCTAGTCAAAAATTTCGGCGTACTCACCAGTCGCCGCGCCTCGCCTCTTGCC GTGCGCGCTCAGCAAGCCGAGTCCTGCGTCGAGAGAGCTCCTCTGGTTTCTCTTTCGCTT @@ -3877,167 +2916,6 @@ AAGAGGCGTGGCCTAGGCAGGACCGAAGAGTGGCGAGCCCTCAGATGCTGCATAAAAGCA GCTGCTTTTGCCTGTACTAGGTCTCTCTAGTTAGACCAGATCTGAGCCTAGGAGCTCTCT GTCTAACTAAGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTTAAGTA GTG ->MK115530.1 -TAACTAGCAGTCCCCCGCGGCGGCCCGGCAATGGCTGGACCCGACCCCCCAACCCCTGCC -GCCGGCGCCGACTATCGAGACTGGTAACCCCCCACCCCCCAACCCTAGCCGCGCGGCCCG -ACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGACAGACTCTG -GTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAGC -AGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCATCCCAAATCTCTAGCAGTGG -CGCCCGAACAGACTCTGGTAACTAGAGATCCCCAGCTCTAGCAGTGGCGCCCGCGACTCT -GGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGAAATCTCTAG -CAGTGGCGCCCGACTGACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGG -CCCCGAGCTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACA -GACTCTGGTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTC -TGGTAACTAGAGATCCCTACTCCAATCTCAGCAGCTCTCTCGGCGCAGGACTCGGCTTGC -TGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTT -GACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAA -AATTAGATTCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAA -AACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAG -AAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGAT -CAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGA -TACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTA -AGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATT -ACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTT -TAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGT -TTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGG -GGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAAT -GGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAA -GGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAA -ATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATA -AAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAAC -CCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGG -AGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGA -CTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAG -GAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATT -CAGTTAATGTAATGATGCAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTT -TCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCT -GTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATT -TTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGAC -CAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCT -CTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCT -TTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGA -TACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAA -AATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGA -AATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAAT -TGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGA -AACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATT -GACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAA -AATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAA -AGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGA -CTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGT -AACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAA -GTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTA -CAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAA -AATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGA -TTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAG -ACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCC -ATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACT -GCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTG -GGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAAC -CAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAA -CAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAAT -AGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATT -TAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAA -ACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAAC -TCCTAAATTTAGACTACCTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTG -GCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATG -GTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGC -TAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGT -TATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTT -GCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCAT -TCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAAT -AAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGA -ACAAGTAGACAAACTAGTCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGA -TAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTT -TAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAA -AGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTAC -ACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGC -AGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGG -GAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGT -TAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCA -AAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAG -AGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAA -AAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAAC -AGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTA -TTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGA -AGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAA -AATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGA -TGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTA -AAGGATGGTTTTATAGACATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTAC -ACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAG -AAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCA -CACAAGTTGACCCTGACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTT -CAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATC -AAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACAC -CAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACG -AGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTT -AGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGG -ACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAAC -CCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCAT -TGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGC -ACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTC -ATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGA -GACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGT -AAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAG -CAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGAC -AAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATG -AGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTG -GGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTA -CCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACC -ACAGAGTCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAA -GAAGTAGGATTGGAAAATGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAA -CAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTA -ACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGT -AGTAAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAA -ATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATA -GATGATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCC -TGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCG -ATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACA -GTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGT -TTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATA -ATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATG -AAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGAT -ATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTA -GTTGAAAAATTAAAAGAACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGA -GGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAAT -ACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTA -GATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTA -GGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACA -GGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGA -GGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATT -GAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGA -GCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGC -GCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAG -CAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGG -GGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAG -CGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAAT -GCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGG -GAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAAC -CAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAAT -TGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGA -TTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGA -TATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAA -GGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGA -TTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTG -AGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAA -ATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCT -ATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAA -GTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTG -GAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCC -TGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATC -TCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGA -TTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCA -GGTGCCTTTAAGACCAATGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGA -AAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTG -GGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGAC -CAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGC -CAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCC -GGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCG -AGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTT -TCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTC -AGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGAT -CTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTT -GCCT >MK115520.1 ATCTCTAGCAGAAGCGCCCGACCAGACTCTGGCGACCGGACACCGTTCATCCCTTGGAGA CCCGCCAGACTCAAGCTATTGCAGTGGCGCCCGACTCTGGAACTAGAGATCCCTCACCCT @@ -4199,168 +3077,6 @@ AGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTC TGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAG CCTCAATAAAGCTTTGCCTTCTAGATGTGTACAATCTAGTTGCCATATTCCTGGACTACA ATCTACTTGTCCATGCATGGCCTCTCCTTTTGCTGACATTTATCACAGC ->MK115503.1 -GCTCTCGAACAGTGCGGACTCTGGTAACTAGAGATCCCTCAGCTCTAGCAGTGGCGCCCG -AACAGAATCTCTAGCAGTGGCGCCCGACGACTCTGGTAACTAGAGATCCTAAATCTCTAG -CAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCCTACTCTAGCAGTGGCGCCCAGA -ACATGGACTCTGGTAACTAGAGACCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGT -AACTAGAGATCCCTCCCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAG -ATCCCTCCTAACTCTAGCAGTGCGCCCGACTCTGGTAACTAGAGATCCTAAATCTCTAGC -AGTGGCGCCCGACAGACTCTGGTAACTAGAGATCCCTCACCTAAATCTCTAGCAGTGGCG -CCCGAGAACAGATCTGGTAACTAGAGCCCTACTAAATCTCTAGCAGTGGCGCCCGAACAG -ACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGGACTCTGGTAACT -AGAGATCCTCCTAAATCTCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATC -CCTCAGCTCTAGCAGTGGCGCCCGAACAGAATCTCTAGCAGTGGCGCCCGGGACTCTGGT -AACTAGAGATCCTCACTAAATCTAGCAGTGGCGCCGAGAGGAGACTCTCTCGGCGCAGGA -CTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGA -AAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATT -AAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAA -ATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCC -TGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTACAACCATCCCT -TCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGT -ACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCA -AAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAG -CAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATC -ACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGT -CATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCT -AAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGA -AGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGAT -GAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGC -ATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTT -GGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGG -ACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCA -AGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCC -AGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAGGAAATGATGAC -AGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAG -CCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGAT -TGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAG -GAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAG -ACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCT -TCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGAC -AATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCT -CAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAA -GCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAA -TGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAG -ATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAGGACCTACACCT -GTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATT -AGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAA -CAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAA -AAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCT -ATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAG -AGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAG -AAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAA -GAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGACACCAGGGATT -AGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGT -AGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAA -TACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATA -GAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACAAAAAACATCAG -AAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAG -CCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGA -AAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTC -CTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAA -CTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATTATGACCCATCA -AAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACATATCAAATTTAT -CAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACT -AATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATA -TGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGGAGACATGGTGG -GCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTA -GTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTA -GATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGA -AGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGTTACAAGCAATT -TATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACTCACAATATACA -TTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATA -GAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATT -GGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTA -GATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATTGGAGAGCAATG -GCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAA -TGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAA -CTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGA -TATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTG -AAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCAGCAATTTCACC -AGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCC -TACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATA -GGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGGCAGTATTCATC -CACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGAT -ATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAAAAATTCAAAAT -TTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTC -TGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGG -AGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCA -AGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCATATGCATGTTTC -AAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCATCCAAGAATAAG -TTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCT -GAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAG -GAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCATCTGTATTACTT -TGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAG -GTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGC -ATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGA -TAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACA -TTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTC -CATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCC -ATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGC -AGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGA -GCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAA -GTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAG -GAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCT -ATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATT -AGTAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAA -AATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGA -CAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCA -CCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCT -ATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTA -AAGCATATACCACAGAGGCACATAATGTTTGGGCCACACATGCCTGTGTACCCACAGACC -CCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATA -ACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCAT -GTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAATGTTACTAATA -CCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATA -TCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTATAAACTTGATG -TAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAACACCTCAGTCA -TTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGG -CTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAA -ATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGT -TAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATG -CTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTACAAGACCCAACA -ACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCA -TAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTT -TAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAATAATCTTTAATC -ACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGGAGGGGAATTTT -TCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATG -CTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGATTATAAACAGGT -GGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCAT -CAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCT -TCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATATAAATATAAAG -TAGAAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAA -GAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAA -GCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTA -TAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAAC -TCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTAC -AGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTG -TGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGATAACATGACCT -GGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACACCTTAATTGAAA -AGGCGCAGAACCAGCAGGAAAAAAATGAACAAGAATTATTGGAATTGGATAAATGGGCAA -GTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATTATTCATAATGA -TAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAG -TTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCG -ACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGAT -TAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCT -GCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCA -GGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAA -AGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATA -GGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAA -GACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGG -GGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTG -GGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCT -ACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCA -GTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCAC -TTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATC -CTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCA -GGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAG -CCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGG -ATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCAT -CACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTAC -AAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGT -GGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGG -TTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCT -CAATAAAGCTTGCCTTG >MK115570.1 AACGTGTCGTGCCCCCAAAACATAACGTAAACGTGGAAGCGGAGAGCCTTAAGGTAACTG CGGGGCCCCAAATCCAATATCTAGGGCGCCCGAACGAGACTCTGGTAACTAGAGATCCCT @@ -4521,163 +3237,6 @@ TCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGGGACAGGGGAGTGGCGAGCCCT CAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGA TCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCT TGCCT ->MK115509.1 -CCCCAAATCTCTAGCCGCCCGAACAGACTCTGGTAACTAGAGATCCCTCCCCAAATCTCT -AGCAGTGGCGCCCGAACAGAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAGAGATCC -TAAATCTCTAGCAGTGGCGCCCGAAGACTCTGGTAACTAGAGATCCCTCACCCTAAATCT -CTAGCAGTGGCGCCCGCTCGTACTAGAGATCCTAAATCTCTAGCAGTGGCGCCCGAACAG -ACTCTGGTAACTAGAGATCCCTCACCCTAATCTCTAGCAGTGGCGCCCGAACAGACTCTG -GTAACTAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAAC -TAGAGATCCCTCACCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTACTAGAGA -TCCCTCAAATCAACCAGAGGAGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCAC -AGCAAGAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAAATTTTTGACTAGCGGAG -GCTAGAAGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATGCA -TGGGAAAAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTA -TGGGCAAGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAG -GGATGTAGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTT -AAATCATTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAA -GACACCAAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCA -CAGCAAGTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTG -CAGAACCTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGG -GTAAAAGTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTA -TCAGAAGGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAA -GCAGCTATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTG -CATCCAGTGCATGCAGGGCCTATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGAC -ATAGCAGGAACTACTAGTACCCTTCAGGAACAAATAGCATGGACGACAAATAATCCACCT -ATCCCAGTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGG -ATGTATAGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGAC -TATGTAGACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAAT -TGGATGACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAA -GCATTAGGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGA -CCAGGCCATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGCTAATGTA -ATGATGCAGAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGC -AAAGAAGGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGT -GGAAAGGAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAA -ATCTGGCCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACA -GCCCCACCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAG -GAGCCAAGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGAC -CCCTCGTCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAG -ATGATACAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGG -GAATTGGAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGAC -ACAAAGCTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATC -TGTTGACTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAG -TAAAATTAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAA -AAATAAAAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAA -TTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTA -AATGGAGAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAG -TTCAATTAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGG -ATGTGGGTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCAT -TTACCATACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGC -CACAGGGATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGC -CTTTTAGAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAG -GATCTGACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGT -TAAGGTGGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGA -TGGGTTATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAG -ACAGCTGGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGA -TTTACGCAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAA -CAGAGGTAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTT -TAAGAGAACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTAC -AGAAGCAGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGA -AAACAGGAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAG -AGGCAGTACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTA -GACTACCTATACAAAAAGAAACATGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCT -GGATTCCTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAG -AGAAAGAACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAA -CTAAATTAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAA -CGGACACAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGG -GATCAGAAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAAC -CAGATAAGAGTGAATCAGAGTTAGTCAATCAGATAATAGAGCAGTTAATAAAAAAGGAAA -AAGTCTACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACA -AACTAGTCAGTACTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAG -AAGACCATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCC -CTGTAGTAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCA -TGCATGGACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAG -GGAAAGTTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTC -CAGCAGAGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAG -TAAAAACAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCT -GTTGGTGGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAG -TAGTAGAATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTG -AACATCTTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGG -GGATTGGGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAA -CTAAAGAATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACA -GCAGAGATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAG -TAATACAAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGG -ATTATGGCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGA -ACATGGAACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTT -TATAGACATCACTATGAAAGCACTCATCCAAGAATAAGTTCAGAAGTACACATCCCACTA -GGGGATGCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGG -CATTTGGGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGAC -CCTAACCTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCT -ATAAGAAATGCCATATTAGGACATATAGTTAGTCCTAGGTGTGAATATCAAGCAGGACAT -AACAAGGTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGA -AAGCCACCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAG -ACCAAGGGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTA -AGAATGAAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCT -ATGAAACTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAAC -TGCTGTTTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGA -GGAGAGCAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGT -CAGCCTAAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTT -TGTTTCATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGA -AGAGCTCCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATAT -GTAATGCAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCA -ATAGTTGTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATA -GACAGGTTAATTGATAGAATAAGAGAAAGAGCAAAAGACAGTGGCAATGAGAGTGAAGGG -GATCAGGAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGAT -GATCTGTAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAA -AGAAGCAAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGGCACA -TAATGTTTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATT -GGAAAATGTGACAGAAAATTTTAACATGTGGAAAAATAACATGGTAGAACAGATGCATGA -GGATGTAATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTG -TGTTACTTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTGAGGAGGG -AAAGATGGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAAAAATAAGAAATAA -GATGCAGAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATAATGATAA -TACAAGTTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGT -ATCCTTTGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTG -TAAGGATAAGAAGTTCAATGGATCAGGACCATGTAAAAATGTCAGCACAGTACAATGTAC -ACATGGAATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGA -AGAGGTAGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCT -GAAGGAACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCC -TCTAGGACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGC -ACATTGTAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATT -AAAAGAACAATATGAGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGA -AATTATAATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCT -GTTTAATAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACAT -CACACTCCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAAT -GTATGCCCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATT -AGTAAGAGATGGTGGTAACACGAGCGAGACTGAGACCTTCAGACCTGGAGGAGGAGATAT -GAAGGACAATTGGAGGAGTGAATTATATAAATATAAAGTAGAAAAAATTGAGCCATTAGG -AGTAGCACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAAT -AGGAGCTGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGT -GACGCTGACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTT -GCTGAGAGCTATTGAGGCGCAACAACATCTGTTGCAACTCACAGTCTGGGGCATCAAGCA -GCTCCAGGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAAT -TTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAG -TAATAAATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAAT -TAACAATTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAA -AAATGAACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACAT -AACAAAATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTT -AAGAATAGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATT -ATCGTTTCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGA -AGAAGGTGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACT -TTTCTGGGACGACCTGCGGAGCCTGTGCCTCTTCCTCTGCCACCGCTTGAGAGACTTACT -CTTGATTGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACA -TTGGTGGAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATT -CAATGTCACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAG -AGCTTGTAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATT -GTTATAAAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGG -AAAGAATGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGG -AAAGACATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGC -TGGAAGCACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAA -GACCAATGACTTTCAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGAC -TGGAAGGGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACA -CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCAC -TGACCTTTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAG -AGAACAACTGCTTGTTACACCCTATGAGCCTGCATGGGATGGAGGACCCGGAAAAAGAAG -TATTAATGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATC -CGGAGTACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTCCGCTGGGGAC -TTTCCAGGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCAT -ATAAGCAGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGG -AGCTCTCTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT >MK115702.1 GAATACTGCCATTTGTACTGCTGTCTTAAGATGTTCAGCCTGATCTCTGACCTGTCCTAT TATTTTCTTTAATTCTTTATTCATAGATTCTACCACTCCTTGACTCTGGGGATTGTAGGG @@ -4985,319 +3544,6 @@ GGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTCTGCCTGTACTAGGTCT CTCTGGTTAGACCAGATCTGAGCCTAGGAGCTCTCTGGCTAACTAGAGAACCCACTGCTT AAGCCTCAATAAAGCTTGCCTTGAGTGCTATAAGTAGTGTGTGCCCGTCTGTTGTGTGAC TCTGGTAACTAGAGATC ->MK115490.1 -CGCTAGTTTAGAGATACTCTTATAACTACAGAACACGCCAACCAAATCGCTAAGAGGGGG -GGCCCGACTGTGGTTACTAAAGATCCATCCAAAATCTCTAGCAGTGGCGCCCGAACAGAC -TCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGC -AGTGGCGCCCAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGA -ACAGACTCTGGTAACTAGAGATCCCTCCTAAATCTCTAGCAGTGGCGCCCGAACAGACTC -TGGTAACTAGAGATCCCTCAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGCAGTG -GCGCCCGAACAAAATCTCTAGCAGTGGCGCCCGAACAAAATCTCTAGCAGTGGCGCCCGA -ACAAATCTCAGCAGGGGCTCTCTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAA -GAGGCGAGGGGCGGCGACTGGTGAGTACGCCGAAAAAATTTTTGACTAGCGGAGGCTAGA -AGGGGAGAGATGGGTGCGAGAGCGTCAATATTAAGCGGGGGAAAATTAGATTCATGGGAA -AAAATTCGGTTAAGGCCAGGGGGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCA -AGCAGGGAGCTAGAACGATTTGCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGT -AGACAAATACTGGGACAGCTACAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCA -TTATTTAATGCAGTAGCAGTCCTCTATTGTGTACATCAAAGGATACAGGTACAAGACACC -AAGGAAGCTTTAGAGAAGGTAGAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAA -GTAGCAGCAGCTGACACTGACACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAAC -CTCCAGGGGCAAATGGTACATCAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAA -GTAGTAGAAGAAAAGGCCTTCAGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAA -GGAGCCACCCCACAAGATTTAAACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCT -ATGCAAATGTTAAAAGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCA -GTGCATGCAGGGCCTATTGCACCAGGTCAGATGAGAGAACCAAGGGGAAGTGACATAGCA -GGAACTACTAGTACCCTTCAGGAACAAATAGCATGGATGACAAATAATCCACCTATCCCA -GTAGGAGAAATCTATAAAAGATGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTAT -AGCCCTACCAGTATTCTGGATATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTA -GACCGGTTCTATAGAACTTTAAGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATG -ACAGAAACCTTGTTGGTCCAAAATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTA -GGACCAGCAGCAACACTAGAGGAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGC -CATAAAGCAAGAGTTTTGGCTGAAGCAATGAGCCAAGTAAATTCAGTTAATGTAATGATG -CAAAGAGGCAATTTTAGAAACCAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAA -GGGCACATAGCCAAAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAG -GAAGGACATCAAATGAAAGACTGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGG -CCTTCCCACAAAGGAAGGCCAGGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCA -CCAGAAGAGAGCTTCAGGTTTGGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCA -AGAGACAAGGAACTGTATCCCTTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCG -TCAGAATAAAGATAGGGGGGCAATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATA -CAGTATTAGAAGAAATGAGTTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTG -GAGGTTTTATCAAAGTAAGACAGTATGATCAGATACCCATAGAAATCTGTGGACACAAAG -CTATAGGTACAGTATTAATAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGA -CTCAGCTTGGTTGTACCTTAAATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAAT -TAAAGCCAGGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAA -AAGCATTAGTAGAAATTTGTACAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGC -CTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGA -GAAAATTAGTAGATTTCAGAGAACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAAT -TAGGAATACCACATCCTGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGG -GTGATGCATATTTTTCAATTCCCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCA -TACCTAGTACAAATAATGAGACACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGG -GATGGAAAGGATCACCAGCAATATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTA -GAAAGCAAAATCCAGATATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTG -ACTTAGAAATAGGGCAGCATAGAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGT -GGGGACTTACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTT -ATGAACTCCATCCTGATAAGTGGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCT -GGACTGTCAATGACATACAGAAGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACG -CAGGGATTAAAGTAAGGCAATTATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGG -TAGTACCACTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAG -AACCAGTACATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGC -AGGGCAATGGACAGTGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAG -GAAAATATGCAAGAATGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAG -TACAAAAGATAGCCACAGAAAGCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTAC -CTATACAAAAAGAAACGTGGGAGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTC -CTGAGTGGGAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAG -AACCCATAGTAGGAGCAGAAACTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAAT -TAGGCAAAGCAGGATATGTCACTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACA -CAACAAATCAAAAGACTGAGTTACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAG -AAGTAAACATAGTAACAGACTCACAATATACATTAGGAATCATTCAAGCACAACCAGATA -AGAGTGAATCAGAGTTAGTCCATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCT -ACCTGGCATGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAG -TCAGTGCTGGAGTCAGGAGAGTACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACC -ATGAGAAATATCACAGTAATTGGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAG -TAGCAAAAGAAATAGTAGCCAGCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATG -GACAAGTAGATTGTAGTCCAGGAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAG -TTATCCTGGTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAG -AGACAGGGCAGGAAACAGCATACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAA -CAATACATACAGACAATGGCAGCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGT -GGGCAGGGATCAAGCAGGAATTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAG -AATCCATGAATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATC -TTAAGACAGCAGTACAAATGGCAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTG -GGGGGTATAGTGCAGGGGAAAGAATAGTAGATATAATAGCAACAGACCTACAAACTAAAG -AATTACAGAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAG -ATCCACTTTGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATAC -AAGATAATAGTGATATAAAAGTAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATG -GCAAACAGATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGG -AACAGTTTAGTAAAACACCATATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGA -CATCACTATGAAAGCACACATCCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGAT -GCTAGATTGGTAGTAACAACATATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTG -GGTCAGGGAGTCTCCATAGAATGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTGAC -CTAGCAGACCAACTAATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGA -AATGCCATATTAGGACATATAGTTAATCCTAGGTGTGAATATCAAGCAGGACATAACAAG -GTAGGCTCTCTACAATACTTGGCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCA -CCTTTACCTAGTGTTAGGAAACTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAG -GGCCACAGAGGGAGCCATACAATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATG -AAGCGGTTAGACATTTTCCTAGGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAA -CTTATGGGGACACTTGGACAGGAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGT -TTATTCATTTCAGACTTGGGTGTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAG -CAAGAAATGGAGCCAGTAGATCCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCT -AAAACTCCTTGTACTAACTGCTATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTC -ATAAAAAAAGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCT -CCTCAAGGCAGTCAGACTGATCAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATG -CAACCTCTGCACATAGCAGCAATAGTAGGATTAGTAGTAGCAGCAATAATAGCAATAGTT -GTGTGGACCATAGTGTTAATAGAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGG -TTAATTGATAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAG -GAAGAATTGTCAGCGCTTATGGAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTG -TAGTGCTACAGAAAAATTGTGGGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGC -AAACACCACTCTATTTTGTGCATCGGATGCTAAAGCATATACCACAGAGTCACATAATGT -TTGGGCCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAA -TGTGACAGAAAATTTTAATATGTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGT -AATCAATTTATGGGATCAAAGCCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTAC -TTTAAATTGCACTAATCTGAATGTTACTAATACCAATAGCAGTAGTAAGGAGGGAAAGAT -GGCGGAAGAAATGAGAAACTGCTCTTTCAATATCACCACAGAAATAAGAAATAAGATGCA -GAAGGAATATGCACTTTTTTATAAACTTGATGTAGTACCAATAGATGATGATAATACAAG -TTATACATTGATAAATTGTAACACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTT -TGAGCCAATTCCTATACATTATTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGA -TAAGAAGTTCAATGGATCAGGACCATGTAAAAGTGTCAGCACAGTACAATGTACACATGG -AATTAAGCCAGTAGTGTCAACTCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGT -AGTAATTAGATCTGAAAATTTCACGAACAATGCTAAAACCATAATAGTACATCTGAAGGA -ACCTATACAAATTAATTGTACAAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGG -ACCAGGAAGAGCATTCTATGCAACAGGAGCCATAATAGGAGATATAAGACAAGCACATTG -TAACCTTAGTAGAAAAGCATGGAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGA -ACAATATGGGAATAAAACAATAATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTAT -AATGCATACTTTTAATTGTGGAGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAA -TAGTACTTGGAATAGTACTTGGACTGGGAATGCTACCGAATTAGATGGAAACATCACACT -CCCATGCAGAATAAAACAGATTATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGC -CCCTCCCATTAGAGGAAAAATTAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAG -AGATGGTGGTAACACGAGCGGGACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGA -CAATTGGAGGAGTGAATTATATAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGC -ACCCACCAGGGCAAAGAGAAGAGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGC -TGTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCT -GACGGTACAAGCCAGGCTGTTATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAG -AGCTATTGAGGCGCAACAACATCTATTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCA -GGCAAGAGTCCTGGCTGTGGAAAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGG -TTGCTCTGGAAAACTCATTTGCACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAA -ATCTCTGAATCAGATTTGGGATAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAA -TTACACAGACACAATATACACCTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGA -ACAAGAATTATTGGAATTGGATAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAA -ATGGCTGTGGTACATAAAATTATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAAT -AGTTTTTGCTGTACTTGCTATAGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTT -TCAGACCCACCTCCCAGCCCCGAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGG -TGGAGAAAGAGACAGAGACAGATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTG -GGACGACCTGCGGAGCCTGTGTCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGAT -TGTAACAAGGATTGTGGAACTTCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTG -GAGTCTCCTGCAGTATTGGATTCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGT -CACAGCCATCGCAGTAGCTGAGGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTG -TAGAGCTCTTCTCCACATACCTACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATA -AAATGGGGGGCAAGTGGTCAAAAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAA -TGAGACGAACTGAGCCAGCAGCAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGAC -ATGGAGCAGTCACAAGTAGCAATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAG -CACAAGAAGAGGACAGTGAAGTGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAA -TGACTTACAAAGGAGCTCTCGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAG -GGCTAATTTACTCCCAAAAAAGACAAGATATCCTTGACCTGTGGGTCTACAACACACAAG -GCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGACCAGATATCCACTGACCT -TTGGGTGGTGTTTCAAGCTAGTACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACA -ACTGCTTGTTACACCCTACGAGCCTGCATGGGGTGGAGGACCCGGAAAAAGAAGTATTAA -TGTGGAAGTTTGACAGCCGCCTAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGT -ACTACAAAGACTGCTGACATTGAGCTTTCTACAAAGGGACTTTTCGCTGGGGACTTTCCA -GGGGAGGTGTGGCCTGGGCGGGACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGC -AGCTGCGTTCTGCCTGTAAGGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCT -CTGGCTAACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCT ->MK115576.1 -AACAGACTCTGGTAAGTAGTGGTCCGCTCAAAATCTCTAGCAGTGGCGCCCGACTCTGGT -AACTAGAGATCCCTCAAAATCTCTAGCAGTGGCGCCCGATCAAAATCTCTAGCAGTGGCG -CCCGAGACTCTGGAACTAGAGATCCAATCTCTAGCAGTGGCGCCCGACTCTGGTAACTAG -AGATCCCTCAGTGAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCC -CTCAAAATCTCTAGCAGTGGCGCCCGAACAGACTCTGGTAACTAGAGATCCAAATCTCTA -GCAGTGGCGCCCGACTCTGGTAACTAGAGATCCCTCAGTGAAATCTCTAGCAGGAGCTCT -CTCGGCGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGCGACTGG -TGAGTACGCCGAAAAAATTTTTGACTAGCGGAGGCTAGAAGGGGAGAGATGGGTGCGAGA -GCGTCAATATTAAGCGGGGGAAAATTAGATGCATGGGAAAAAATTCGGTTAAGGCCAGGG -GGAAAGAAAAAATATAGATTAAAACATTTAGTATGGGCAAGCAGGGAGCTAGAACGATTT -GCCGTTAACCCTGGCCTGTTAGAAACATCAGAGGGATGTAGACAAATACTGGGACAGCTA -CAACCATCCCTTCAGACAGGATCAGAAGAACTTAAATCATTATTTAATGCAGTAGCAGTC -CTCTATTGTGTACATCAAAGGATACAGGTACAAGACACCAAGGAAGCTTTAGAGAAGGTA -GAGGAAGAGCAAAACAAAAGTAAGAAAAAGGCACAGCAAGTAGCAGCAGCTGACACTGAC -ACAGGAAACAGCAGCCAAAATTACCCCATAGTGCAGAACCTCCAGGGGCAAATGGTACAT -CAGCCCCTATCACCTAGAACTTTAAATGCATGGGTAAAAGTAGTAGAAGAAAAGGCCTTC -AGCCCAGAAGTCATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACAAGATTTA -AACACCATGCTAAACACAGTGGGGGGACATCAAGCAGCTATGCAAATGTTAAAAGAAACC -ATCAATGAGGAAGCTGCAGAATGGGATAGATTGCATCCAGTGCATGCAGGGCCTATTGCA -CCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACTACTAGTACCCTTCAG -GAACAAATAGCATGGACGACAAATAATCCACCTATCCCAGTAGGAGAAATCTATAAAAGA -TGGATAATCTTGGGATTAAATAAAATAGTAAGGATGTATAGCCCTACCAGTATTCTGGAT -ATAAAACAAGGACCAAAGGAACCCTTTAGAGACTATGTAGACCGGTTCTATAGAACTTTA -AGAGCTGAGCAAGCTTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTTGGTCCAA -AATTCGAATCCAGATTGTAAGACTATTTTAAAAGCATTAGGACCAGCAGCAACACTAGAG -GAAATGATGACAGCATGTCAAGGAGTGGGGGGACCAGGCCATAAAGCAAGAGTTTTGGCT -GAAGCAATGAGCCAAGTAAATTCAGCTAATGTAATGATGCAGAGAGGCAATTTTAGAAAC -CAAAGAAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAAGGGCACATAGCCAAAAATTGC -AGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACATCAAATGAAAGAC -TGTACAGAGAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAAAGGAAGGCCA -GGGAACTTCCTTCAGAGCAGACCAGAGCCAACAGCCCCACCAGAAGAGAGCTTCAGGTTT -GGGGAAGAGACAATAACTCCCTCTCAGAAGCAGGAGCCAAGAGACAAGGAACTGTATCCC -TTGTCTTCCCTCAAATCACTCTTTGGCAGCGACCCCTCGTCAGAATAAAGATAGGGGGGC -AATTTAAAGAAGCTTTATTAGATACAGGAGCAGATGATACAGTATTAGAAGAAATGAGTT -TGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAAGTAAGAC -AGTATGATCAGATACCCATAGAAATCTGTGGACACAAAGCTATAGGTACAGTATTAATAG -GACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAGCTTGGTTGTACCTTAA -ATTTTCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCAGGAATGGATGGCC -CAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTAGTAGAAATTTGTA -CAGAAATGGAAAAGGAAGGAAAAATTTCAAAAATTGGGCCTGAAAATCCATACAATACTC -CAGTATTTGCTATAAAGAAAAAAGACAGTACTAAATGGAGAAAATTAGTAGATTTCAGAG -AACTCAATAAGAGAACTCAAGACTTTTGGGAAGTTCAATTAGGAATACCACATCCTGCAG -GGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCATATTTTTCAATTC -CCTTAGATAAAGAATTCAGGAAGTATACTGCATTTACCATACCTAGTACAAATAATGAGA -CACCAGGGATTAGGTATGAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCAGCAA -TATTCCAAAGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAGCAAAATCCAGATATAG -TTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAAATAGGGCAGCATA -GAACAAAAATAGAGGAACTGAGACAACATCTGTTAAGGTGGGGACTTACCACACCAGACA -AAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTCCATCCTGATAAGT -GGACAGTACAGCCTATAATACTGCCAGAAAAAGACAGCTGGACTGTCAATGACATACAGA -AGTTAGTGGGAAAATTAAATTGGGCAAGTCAGATTTACGCAGGGATTAAAGTAAGGCAAT -TATGTAAACTCCTTAGGGGAACCAAAGCACTAACAGAGGTAGTACCACTAACAGAAGAAG -CAGAGCTAGAACTGGCAGAAAACAGGGAAATTTTAAGAGAACCAGTACATGGAGTGTATT -ATGACCCATCAAAAGACTTAATAGCAGAAGTACAGAAGCAGGGCAATGGACAGTGGACAT -ATCAAATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATATGCAAGAATGAGGG -GTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTACAAAAGATAGCCACAGAAA -GCATAGTAATATGGGGAAAAACTCCTAAATTTAGACTACCTATACAAAAAGAAACATGGG -AGACATGGTGGGCAGAGTACTGGCAAGCCACCTGGATTCCTGAGTGGGAGTTTGTCAATA -CCCCTCCCTTAGTGAAATTATGGTACCAATTAGAGAAAGAACCCATAGTAGGAGCAGAAA -CTTTCTATGTAGATGGGGCAGCTAATAGAGAAACTAAATTAGGCAAAGCAGGATATGTCA -CTGACAGAGGAAGACAAAAGGTTATCTCCCTAACGGACACAACAAATCAAAAGACTGAGT -TACAAGCAATTTATCTAGCTTTGCAGGATTCGGGATCAGAAGTAAACATAGTAACAGACT -CACAATATACATTAGGAATCATTCAAGCACAACCAGATAAGAGTGAATCAGAGTTAGTCA -ATCAGATAATAGAGCAGTTAATAAAAAAGGAAAAAGTCTACCTGGCATGGGTACCAGCAC -ACAAAGGAATTGGAGGAAATGAACAAGTAGACAAACTAGTCAGTACTGGAGTCAGGAGAG -TACTATTTCTAGATGGAATAGATAAGGCCCAAGAAGACCATGAGAAATATCACAGTAATT -GGAGAGCAATGGCTGGTGATTTTAATATACCCCCTGTAGTAGCAAAAGAAATAGTAGCCA -GCTGTGATAAATGTCAGCAAAAAGGAGAGGCCATGCATGGACAAGTAGATTGTAGTCCAG -GAATATGGCAACTAGATTGTACACATCTAGAAGGGAAAGTTATCCTGGTAGCAGTTCATG -TAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAGACAGGGCAGGAAACAGCAT -ACTTTCTCCTGAAACTAGCAGGGAGATGGCCAGTAAAAACAATACATACAGACAATGGCA -GCAATTTCACCAGTAATGTGGTTAAGGCCGCCTGTTGGTGGGCAGGGATCAAGCAGGAAT -TTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCCATGAATAAAGAATTAA -AGAAAATTATAGGACAGGTAAGAGATCAGGCTGAACATCTTAAGACAGCAGTACAAATGG -CAGTATTCATCCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTATAGTGCAGGGGAAA -GAATAGTAGATATAATAGCAACAGACCTACAAACTAAAGAATTACAGAAACAAATTACAA -AAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTTTGGAAAGGACCAG -CAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGATAATAGTGATATAAAAG -TAGTGCCAAGGAGAAAAGCAAAAATCATTAGGGATTATGGCAAACAGATGGCAGGTGATG -ATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAACAGTTTAGTAAAACACCAT -ATGCATGTTTCAAAGAAAACTAAAGGATGGTTTTATAGACATCACTATGAAAGCACTCAT -CCAAGAATAAGTTCAGAAGTACACATCCCACTAGGGGATGCTAGATTGGTAGTAACAACA -TATTGGGGCCTGAATACAGGAGAAAGAGAATGGCATTTGGGTCAGGGAGTCTCCATAGAA -TGGAGAAAAAGGAAATATAGCACACAAGTTGACCCTAACCTAGCAGACCAACTAATTCAT -CTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAATGCCATATTAGGACATATA -GTTAGTCCTAGGTGTGAATATCAAGCAGGACATAACAAGGTAGGCTCTCTACAATACTTG -GCACTAAAAGCATTAACAACACCAAAGAGAAGAAAGCCACCTTTACCTAGTGTTAGGAAA -CTGACAGAGGATAGATGGAACGAGCACCAGAAGACCAAGGGCCACAGAGGGAGCCATACA -ATGAATGGACATTAGAGCTTTTAGAGGAACTTAAGAATGAAGCGGTTAGACATTTTCCTA -GGCCGTGGCTCCATGGCTTAGGACAACATATCTATGAAACTTATGGGGACACTTGGACAG -GAGTGGAGGCCATAATAAGAACCCTGCAACAACTGCTGTTTATTCATTTCAGACTTGGGT -GTCGACATAGCAGAATAGGCATTGTGCCACAGAGGAGAGCAAGAAATGGAGCCAGTAGAT -CCTAGACTAGAGCCCTGGAAGCACCCAGGAAGTCAGCCTAAAACTCCTTGTACTAACTGC -TATTGTAAAAAGTGTTGCTTTCATTGCCAAGTTTGTTTCATAAAAAAAGCCTTAGGCATC -TCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTCCTCAAGGCAGTCAGACTGAT -CAAGATTCTCTATCAAAGCAGTAAGTAGTATATGTAATGCAACCTCTGCACATAGCAGCA -ATAGTAGGATTAATAGTAGCAGCAATAATAGCAATAGTTGTGTGGACCATAGTGTTAATA -GAATATAGGAAAATATTAAGACAAAAAAGGATAGACAGGTTAATTGATAGAATAAGAGAA -AGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAATTGTCAGCGCTTATG -GAGATGGGGCACCATGCTCCTGGGGATGTTGATGATCTGTAGTGCTACAGAAAAATTGTG -GGTGACAGTCTATTATGGGGTACCTGTATGGAAAGAAGCAAACACCACTCTATTTTGTGC -ATCGGATGCTAAAGCATATACCCCAGAGGCACATAATGTTTGGGCCACACATGCCTGTGT -ACCCACAGACCCCAACCCACAAGAAGTAGGATTGGAAAATGTGACAGAAAATTTTAACAT -GTGGAAAAATAACATGGTAGAACAGATGCATGAGGATGTAATCAATTTATGGGATCAAAG -CCTAAAGCCATGTGTAAAATTAACCCCACTCTGTGTTACTTTAAATTGCACTAATCTGAA -TGTTACTAATACCAATAGCAGTAGTGAGGAGGGAAAGATGGCGGAAGAAATGAGAAACTG -CTCTTTCAATATCACCACAAAAATAAGAAATAAGATGCAGAAGGAATATGCACTTTTTTA -TAAACTTGATGTAGTACCAATAGATAATGATAATACAAGTTATACATTGATAAATTGTAA -CACCTCAGTCATTACACAGGCCTGTCCAAAGGTATCCTTTGAGCCAATTCCTATACATTA -TTGTGCCCCGGCTGGTTTTGCGATTCTAAAGTGTAAGGATAAGAAGTTCAATGGATCAGG -ACCATGTAAAAATGTCAGCACAGTACAATGTACACATGGAATTAAGCCAGTAGTGTCAAC -TCAACTACTGTTAAATGGCAGTTTAGCAGAAGAAGAGGTAGTAATTAGATCTGAAAATTT -CACGAACAATGCTAAAACCATAATAGTACATCTGAAGGAACCTATACAAATTAATTGTAC -AAGACCCAACAACAATACAATGAAAAGTATCCCTCTAGGACCAGGAAGAGCATTCTATGC -AACAGGAGCCATAATAGGAGATATAAGACAAGCACATTGTAACCTTAGTAGAAAAGCATG -GAATAATACTTTAAAACAGGTAGTTGAAAAATTAAAAGAACAATATGAGAATAAAACAAT -AATCTTTAATCACTCCTCAGGAGGGGACCCAGAAATTATAATGCATACTTTTAATTGTGG -AGGGGAATTTTTCTATTGTAATACAACACAGCTGTTTAATAGTACTTGGAATAGTACTTG -GACTGGGAATGCTACCGAATTAGATGGAAACATCACACTCCCATGCAGAATAAAACAGAT -TATAAACAGGTGGCAAGAAGTAGGAAAAGCAATGTATGCCCCTCCCATTAGAGGAAAAAT -TAGATGTTCATCAAATATTACAGGGTTACTATTAGTAAGAGATGGTGGTAACACGAGCGA -GACTGAGACCTTCAGACCTGGAGGAGGAGATATGAAGGACAATTGGAGGAGTGAATTATA -TAAATATAAAGTAGTAAAAATTGAGCCATTAGGAGTAGCACCCACCAGGGCAAAGAGAAG -AGTGGTGCAAAGAGAAAAAAGAGCAGTGGGAATAGGAGCTGTGTTCCTTGGGTTCTTGGG -AGCAGCAGGAAGCACTATGGGCGCAGCGTCAGTGACGCTGACGGTACAAGCCAGGCTGTT -ATTGTCTGGTATAGTGCAACAGCAAAACAATTTGCTGAGAGCTATTGAGGCGCAACAACA -TCTGTTGCAACTCACAGTCTGGGGCATCAAGCAGCTCCAGGCAAGAGTCCTGGCTGTGGA -AAGATACCTACAGGATCAACAGCGCCTGGGAATTTGGGGTTGCTCTGGAAAACTCATTTG -CACCACTGCTGTGCCCTGGAATGCTAGTTGGAGTAATAAATCTCTGAATCAGATTTGGGA -TAACATGACCTGGATGGAGTGGGAAAGAGAAATTAACAATTACACAGACACAATATACAC -CTTAATTGAAAAGGCGCAGAACCAGCAGGAAAAGAATGAACAAGAATTATTGGAATTGGA -TAAATGGGCAAGTTTGTGGAATTGGTTTAACATAACAAAATGGCTGTGGTACATAAAATT -ATTCATAATGATAGTAGGAGGATTGATAGGTTTAAGAATAGTTTTTGCTGTACTTGCTAT -AGTAAATAGAGTTAGGCAGGGATATTCACCATTATCGTTTCAGACCCACCTCCCAGCCCC -GAGGGGACCCGACAGGCCCGAAGGAATCGAAGAAGAAGGTGGAGAAAGAGACAGAGACAG -ATCAGTTCGATTAGTGAACGGATTCTTGGCACTTTTCTGGGACGACCTGCGGAGCCTGTG -CCTCTTCCTCTGCCACCGCTTGAGAGACTTACTCTTGATTGTAACAAGGATTGTGGAACT -TCTGGGACGCAGGGGGTGGGAAATCCTCAAACATTGGTGGAGTCTCCTGCAGTATTGGAT -TCAGGAGCTAAAGAGTAGTGCTATTAGCTTATTCAATGTCACAGCCATCGCAGTAGCTGA -GGGGACAGATAGGGTTATAGAAGTAGTACAAAGAGCTTGTAGAGCTCTTCTCCACATACC -TACAAGAATAAGACAGGGCTTGGAAAGGGCATTGTTATAAAATGGGGGGCAAGTGGTCAA -AAAGTAGTGGGGGTGGATGGCCTGCTGTAAGGGAAAGAATGAGACGAACTGAGCCAGCAG -CAGAAGGGGTGGGAGCAGTATCTCGAGACCTGGAAAGACATGGAGCAGTCACAAGTAGCA -ATACAGCAGCTACCAATGCTGATTGCGCCTGGCTGGAAGCACAAGAAGAGGACAGTGAAG -TGGGTTTTCCAGTCAGACCTCAGGTGCCTTTAAGACCAATGACTTTCAAAGGAGCTCTCG -ATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTTACTCCCAAAAAA -GACAAGATATCCTTGACCTGTGGGTCTACAACACACAAGGCTACTTCCCTGATTGGCAGA -ACTACACACCAGGGCCAGGGACCAGATATCCACTGACCTTTGGGTGGTGTTTCAAGCTAG -TACCAGTGGAGCCAGAAGAGGCCAATCAAGGAGAGAACAACTGCTTGTTACACCCTACGA -GCCTGCATGGGATGGAGGACCCGGAAAAAGAAGTATTAATGTGGAAGTTTGACAGCCGCC -TAGCATTTCATCACATGGCCCGAGAGAAGCATCCGGAGTACTACAAAGACTGCTGACATT -GAGCTTTCTACAAAGGGACTTTCCGCTGGGGACTTTCCAGGGGAGGTGTGGCCTGGGCGG -GACTGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCGTTCTGCCTGTAAGG -GGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCAC -TGCTTAAGCCTCAATAAAGCTTGCCT >OQ092466 GACGGCCGAGGTGGCTCTGGAAGGGCTAATTCACTCCCCAAAAAGACAAGAGATCCTTGA TCTGTGGGTCTATCATACACAAGGTTTCTTCCCTGATTGGGATAACTACACACCAGGGCC diff --git a/tests/expected-results-single/errors.json b/tests/expected-results-single/errors.json index c0fb715..abf6ec8 100644 --- a/tests/expected-results-single/errors.json +++ b/tests/expected-results-single/errors.json @@ -1,14 +1,3 @@ { - "MN692145": [ - { - "sequence_name": "MN692145", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 5 deletions 4." - }, - { - "sequence_name": "MN692145", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 7 deletions 2." - } - ] + "MN692145": [] } \ No newline at end of file diff --git a/tests/expected-results-single/intact.fasta b/tests/expected-results-single/intact.fasta index e69de29..1f7afc5 100644 --- a/tests/expected-results-single/intact.fasta +++ b/tests/expected-results-single/intact.fasta @@ -0,0 +1,163 @@ +>MN692145 +TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA +CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC +TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA +GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT +GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT +ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG +AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT +GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC +TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG +TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG +TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG +AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC +GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG +TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG +GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA +ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG +ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT +AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA +TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC +AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT +GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA +GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA +AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA +AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC +TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC +CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA +TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT +TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA +AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT +GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC +ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT +CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA +TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC +CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA +AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA +GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG +CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA +ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA +AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA +GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT +ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG +ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT +GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA +GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA +ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT +CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA +GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA +CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA +TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT +ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA +GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA +AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA +ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT +ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC +CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC +AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC +AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA +CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA +CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA +GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT +GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA +ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA +AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG +GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA +GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA +GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT +CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC +ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA +TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA +TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT +GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA +TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA +GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA +GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG +GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA +CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT +ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG +ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG +AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA +GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC +AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA +AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT +TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT +AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG +ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT +AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA +TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT +GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG +AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA +CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT +ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC +TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC +TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG +AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT +AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG +GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT +TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT +GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC +TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA +AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA +CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT +ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC +TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA +TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT +ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG +CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA +CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG +CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA +CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA +GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA +ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG +GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG +AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA +ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA +AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA +AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT +GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG +AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC +AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG +TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG +CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT +TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG +AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC +TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG +GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA +AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT +TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC +CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA +GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA +AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA +TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC +AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG +TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC +AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT +GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG +AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC +AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT +GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG +GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC +AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC +CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC +GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT +GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA +GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA +TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG +GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA +TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA +GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT +GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT +CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA +GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA +TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG +GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC +AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA +GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG +CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG +GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG +CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG +GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT +GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC +CTTTTAGTCAGTGTGGAAAATCTCTAGCA diff --git a/tests/expected-results-single/nonintact.fasta b/tests/expected-results-single/nonintact.fasta index 1f7afc5..e69de29 100644 --- a/tests/expected-results-single/nonintact.fasta +++ b/tests/expected-results-single/nonintact.fasta @@ -1,163 +0,0 @@ ->MN692145 -TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA -CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC -TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA -GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT -GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT -ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG -AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT -GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC -TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG -TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG -TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG -AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC -GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG -TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG -GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA -ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG -ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT -AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA -TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC -AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT -GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA -GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA -AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA -AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC -TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC -CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA -TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT -TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA -AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT -GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC -ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT -CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA -TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC -CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA -AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA -GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG -CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA -ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA -AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA -GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT -ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG -ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT -GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA -GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA -ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT -CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA -GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA -CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA -TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT -ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA -GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA -AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA -ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT -ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC -CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC -AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC -AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA -CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA -CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA -GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT -GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA -ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA -AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG -GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA -GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA -GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT -CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC -ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA -TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA -TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT -GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA -TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA -GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA -GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG -GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA -CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT -ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG -ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG -AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA -GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC -AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA -AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT -TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT -AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG -ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT -AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA -TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT -GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG -AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA -CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT -ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC -TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC -TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG -AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT -AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG -GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT -TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT -GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC -TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA -AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA -CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT -ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC -TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA -TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT -ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG -CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA -CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG -CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA -CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA -GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA -ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG -GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG -AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA -ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA -AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA -AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT -GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG -AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC -AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG -TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG -CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT -TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG -AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC -TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG -GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA -AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT -TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC -CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA -GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA -AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA -TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC -AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG -TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC -AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT -GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG -AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC -AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT -GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG -GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC -AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC -CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC -GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT -GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA -GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA -TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG -GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA -TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA -GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT -GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT -CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA -GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA -TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG -GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC -AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA -GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG -CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG -GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG -CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG -GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT -GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC -CTTTTAGTCAGTGTGGAAAATCTCTAGCA diff --git a/tests/expected-results-small/errors.json b/tests/expected-results-small/errors.json index 5fd1d42..8e60474 100644 --- a/tests/expected-results-small/errors.json +++ b/tests/expected-results-small/errors.json @@ -20,11 +20,6 @@ "error": "DeletionInOrf", "message": "Smaller ORF tat_exon1 at 5829-6044 can have maximum deletions 30, got 213" }, - { - "sequence_name": "KX505501.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 0 deletions 212." - }, { "sequence_name": "KX505501.1", "error": "DeletionInOrf", @@ -32,13 +27,13 @@ }, { "sequence_name": "KX505501.1", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 0 deletions 73." + "error": "InternalStopInOrf", + "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon" }, { "sequence_name": "KX505501.1", - "error": "InternalStopInOrf", - "message": "Smaller ORF vpu at 6060-6309 contains an internal stop codon" + "error": "FrameshiftInOrf", + "message": "Smaller ORF tat_exon2 at 8375-8468 contains out of frame indels that impact 80 positions." }, { "sequence_name": "KX505501.1", @@ -67,16 +62,6 @@ } ], "MN691959": [ - { - "sequence_name": "MN691959", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 2 deletions 1." - }, - { - "sequence_name": "MN691959", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 3 deletions 1." - }, { "sequence_name": "MN691959", "error": "InternalStopInOrf", @@ -99,6 +84,11 @@ "error": "DeletionInOrf", "message": "Smaller ORF vif at 5040-5619 can have maximum deletions 30, got 81" }, + { + "sequence_name": "MN692074", + "error": "InsertionInOrf", + "message": "Smaller ORF vpr at 5558-5849 can have maximum insertions 90, got 207" + }, { "sequence_name": "MN692074", "error": "InternalStopInOrf", @@ -107,12 +97,17 @@ { "sequence_name": "MN692074", "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 1 deletions 153." + "message": "Smaller ORF rev_exon1 at 5968-6044 contains out of frame indels that impact 51 positions." + }, + { + "sequence_name": "MN692074", + "error": "InsertionInOrf", + "message": "Smaller ORF vpu at 6060-6309 can have maximum insertions 90, got 249" }, { "sequence_name": "MN692074", "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 18 deletions 31." + "message": "Smaller ORF tat_exon2 at 8375-8468 contains out of frame indels that impact 81 positions." }, { "sequence_name": "MN692074", @@ -135,18 +130,7 @@ "message": "Query sequence contains a long deletion." } ], - "MN692145": [ - { - "sequence_name": "MN692145", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 5 deletions 4." - }, - { - "sequence_name": "MN692145", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 7 deletions 2." - } - ], + "MN692145": [], "MN090335": [ { "sequence_name": "MN090335", @@ -163,16 +147,6 @@ "error": "FrameshiftInOrf", "message": "ORF gag at 1175-2291 contains an out of frame indel, deletions 91 insertions 33." }, - { - "sequence_name": "MN090335", - "error": "FrameshiftInOrf", - "message": "Smaller ORF tat_exon1 at 5829-6044 contains an out of frame indel: insertions 7 deletions 6." - }, - { - "sequence_name": "MN090335", - "error": "FrameshiftInOrf", - "message": "Smaller ORF rev_exon1 at 5968-6044 contains an out of frame indel: insertions 4 deletions 2." - }, { "sequence_name": "MN090335", "error": "InternalStopInOrf", diff --git a/tests/expected-results-small/intact.fasta b/tests/expected-results-small/intact.fasta index e69de29..1f7afc5 100644 --- a/tests/expected-results-small/intact.fasta +++ b/tests/expected-results-small/intact.fasta @@ -0,0 +1,163 @@ +>MN692145 +TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA +CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC +TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA +GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT +GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT +ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG +AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT +GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC +TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG +TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG +TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG +AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC +GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG +TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG +GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA +ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG +ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT +AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA +TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC +AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT +GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA +GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA +AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA +AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC +TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC +CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA +TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT +TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA +AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT +GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC +ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT +CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA +TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC +CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA +AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA +GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG +CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA +ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA +AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA +GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT +ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG +ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT +GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA +GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA +ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT +CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA +GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA +CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA +TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT +ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA +GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA +AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA +ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT +ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC +CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC +AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC +AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA +CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA +CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA +GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT +GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA +ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA +AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG +GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA +GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA +GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT +CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC +ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA +TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA +TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT +GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA +TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA +GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA +GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG +GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA +CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT +ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG +ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG +AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA +GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC +AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA +AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT +TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT +AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG +ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT +AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA +TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT +GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG +AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA +CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT +ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC +TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC +TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG +AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT +AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG +GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT +TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT +GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC +TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA +AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA +CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT +ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC +TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA +TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT +ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG +CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA +CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG +CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA +CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA +GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA +ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG +GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG +AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA +ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA +AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA +AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT +GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG +AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC +AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG +TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG +CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT +TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG +AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC +TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG +GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA +AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT +TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC +CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA +GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA +AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA +TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC +AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG +TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC +AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT +GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG +AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC +AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT +GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG +GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC +AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC +CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA +AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC +GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT +GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA +GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA +TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG +GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA +TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA +GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT +GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT +CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA +GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA +TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG +GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC +AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA +GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG +CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG +GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG +CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG +GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT +GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC +CTTTTAGTCAGTGTGGAAAATCTCTAGCA diff --git a/tests/expected-results-small/nonintact.fasta b/tests/expected-results-small/nonintact.fasta index 94eb85d..1baa046 100644 --- a/tests/expected-results-small/nonintact.fasta +++ b/tests/expected-results-small/nonintact.fasta @@ -264,169 +264,6 @@ ACACAACAAATCAGAAGACTGAATTACAAGCAATTCATCTAGCTTTGCAGGATTCGGGAT TAGAAGTAAACATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAG ATACCCAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGG TCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTC ->MN692145 -TGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTATGGATCTACCACA -CACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCAC -TGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGACAGAGAGAATGACA -GATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGAGAAGTGTTAGAGT -GGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTGCATCCGGAGTACT -ACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGGGACTTTCCAGGGG -AGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTGCATATAAGCAGCT -GCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGC -TGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTG -TGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTG -TGGAAAATCTCTAGCAGTGGCGCCCGAACAGGGACTTGAAAGCGAAAGAGAAACCAGAGG -AGATCTCTCGACGCAGGACTCGGCTTGCTGAAGCGCGCACAGCAAGAGGCGAGGGGCGGC -GACTGGTGAGTACGCCAAAAATTTTTTTTGACTAGCGGAGGCTAGAAGGAGAGAGATGGG -TGCGAGAGCGTCAGTATTAAGCGGGGGAAAATTAGATCAATGGGAGAAAATTCGGTTAAG -GCCAGGGGGAAAGAAAAAATATCAATTAAAACATATAGTATGGGCAAGCAAGGAACTAGA -ACGATTTGCAGTTAATCCTGGCCTGTTAGAAACAACAGAAGGATGTAGACAAATACTGGG -ACAGCTACAACCATCTCTTCAGACAGGATCAGAAGAACTTAAATCATTATATAATACAGT -AGCAACCCTCTATTGTGTGCATCAAAGGATAGATGTAAAAGACACCAAGGAAGCATTAGA -TAAGATAGAGGAAGAGCAAAACAAGAGTAAGGAAAAAGCAAAACAAGCAGCAGCTGACAC -AGGAAACAGCAACCAGGTCAGCCAAAATTACCCTATAGTGCAGAACCTTCAGGGCCAAAT -GGTACACCAGGCCATATCACCTAGAACTTTAAATGCATGGGTAAAAGTAATAGAAGAGAA -GGCTTTCAGCCCAGAAGTAATACCCATGTTTTCAGCATTATCAGAAGGAGCCACCCCACA -AGATTTAAACACCATGCTAAATACAGTGGGGGGACATCAAGCAGCCATGCAAATGTTAAA -AGAAACCATCAATGAGGAAGCTGCAGAATGGGATAGAGTGCATCCAGTGCATGCAGGGCC -TATTGCACCAGGCCAGATGAGAGAACCAAGGGGAAGTGACATAGCAGGAACCACTAGTAC -CCTTCAGGAACAAATAGGATGGATGACAAATAATCCACCTATCCCAGTAGGAGAAATCTA -TAAAAGATGGATAATCCTGGGATTAAATAAAATAGTAAGGATGTATAGTCCTACCAGCAT -TCTGGATATAAGACAAGGACCAAAAGAATCCTTTAGAGATTATGTAGACCGGTTCTACAA -AACTCTAAGAGCTGAGCAAGCCTCACAGGAGGTAAAAAATTGGATGACAGAAACCTTGTT -GGTCCAAAATTCAAACCCAGATTGTAAGACTATCTTAAAAGCATTGGGACCAGGAGCTAC -ACTAGAAGAAATGATGACAGCATGTCAGGGAGTGGGAGGACCCGGCCATAAAGCAAGAGT -CTTGGCTGAAGCAATGAGCCAAGTAACAAATTCAGCTACCATAATGATGCAGAGAGGCAA -TTTTAGGAGCCAAAGGAAGATTGTTAAGTGTTTCAATTGTGGCAAAGAGGGGCATATAGC -CAGAAATTGCAGGGCCCCTAGGAAAAAGGGCTGTTGGAAATGTGGAAAGGAAGGACACCA -AATGAAAGATTGTACTGAAAGACAGGCTAATTTTTTAGGGAAAATCTGGCCTTCCCACAA -GGGGAGGCCAGGAAATTTCCTTCAGAGCAGGCCAGAGCCAACAGCCCCACCAGAAGAGAG -CTTCAGGTTTGGGGAAGAGACAACAACTCCCTCTCAGAAGCAGGAGTCGACAGGCAAGGA -ACTGTATCCTCCTTTAGCTTCCCTCAGATCACTCTTTGGCAACGACCCCTCGTCACAATA -AAGATAGGGGGGCAACTAAAGGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTA -GAAGAAATGAGTTTACCAGGAAGATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTT -ATTAAAGTAAGACAGTATGATCAGATATCCATAGAAATCTGTGGACATAAAGCTATAGGG -ACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGAAGAAATCTGTTGACTCAAATT -GGTTGTACTTTAAATTTCCCCATTAGTCCTATTGAAACTGTACCAGTAAAATTAAAGCCA -GGAATGGATGGCCCAAAAGTTAAACAATGGCCATTGACAGAAGAAAAAATAAAAGCATTA -ACAGAAATTTGTACAGAAATGGAAAAGGAAGGGAAAATTTCAAAAATTGGGCCTGAAAAT -CCATACAATACTCCAGTATTTGCTATAAAGAAAAAAGACAGCACTAAATGGAGAAAATTA -GTAGATTTCAGAGAACTTAATAAAAGAACTCAAGATTTCTGGGAAGTTCAATTAGGGATA -CCACATCCAGCAGGGTTAAAAAAGAAAAAATCAGTAACAGTACTGGATGTGGGTGATGCA -TATTTTTCAGTTCCCTTAGATGAGGATTTCAGGAAGTATACTGCATTTACCATACCTAGT -ATAAACAATGAGACACCAGGGATTAGATATCAGTACAATGTGCTTCCACAGGGATGGAAA -GGATCACCAGCAATATTCCAATGTAGCATGACAAAAATCTTAGAGCCTTTTAGAAAACAA -AATCCAGACATAGTTATCTATCAATACATGGATGATTTGTATGTAGGATCTGACTTAGAA -ATAGGGCAGCATAGAACAAAAATAGAGGAATTGAGACAACATCTGTTGAGGTGGGGATTT -ACCACACCAGACAAAAAACATCAGAAAGAACCTCCATTCCTTTGGATGGGTTATGAACTC -CATCCTGATAAATGGACAGTACAGCCTATAGTGCTGCCAGAAAAAGAAAGCTGGACTGTC -AATGACATACAAAAGTTAGTGGGTAAATTGAATTGGGCAAGTCAGATTTATGCAGGGATC -AAAGTAAAACAATTATGTAAACTTCTTAGGGGAGCCAAAGCACTAACAGAAGTAATACCA -CTAACAGAAGAAGCAGAGCTAGAACTGGCAGAAAACAGGGAGATTTTAAAAGAACCAGTA -CATGGAGTGTATTATGACCCATCAAAAGACTTAATAGCAGAAATACAGAAGCAGGGGCAA -GGCCAATGGACATATCAGATTTATCAAGAGCCATTTAAAAATCTGAAAACAGGAAAATAT -GCAAGAGTGAGGGGTGCCCACACTAATGATGTAAAACAATTAACAGAGGCAGTGCAAAAA -ATAGCCACTGAAAGCATAGTAATATGGGGAAAGACTCCTAAATTTAGGTTACCCATACAA -AAAGAAACATGGGAAACATGGTGGACAGAGTATTGGCAAGCCACCTGGATTCCTGAGTGG -GAGTTTGTCAATACCCCTCCCTTAGTGAAATTATGGTACCAGTTAGAGAAAGAACCCATA -GTAGGAGCAGAAACTTTCTATGTAGATGGGGCATCTAATAGAGAGACTAAATTAGGAAAA -GCAGGATATGTTACTGACAGAGGAAGACAGAAAGTTGTCTCCCTAACTGACACAACAAAT -CAGAAGACTGAGTTACAAGCAATTCATCTAGCTTTGCAGGATTCAGGATTAGAAGTAAAC -ATAGTAACAGACTCACAATATGCATTAGGAATCATTCAAGCACAACCAGATAAAAGTGAA -TCAGAGTTAGTCAATCAAATAATAGAACAGTTAATAAACAAGGAAAAGGTCTACTTGGCA -TGGGTACCAGCACACAAAGGAATTGGAGGAAATGAACAAGTAGATAAATTAGTTAGTACT -GGAATTAGAAAAGTACTATTTTTAGATGGAATAGATAAGGCCCAAGAAGAACATGAGAAA -TACCACAGTAATTGGAGAGCAATGGCTAGTGATTTTAACCTGCCACCTGTGGTAGCAAGA -GAAATAGTAGCCAGCTGTGATAAATGTCAGCTAAAAGGAGAAGCCATGCATGGACAAGTA -GACTGTAGTCCAGGAATATGGCAGCTAGATTGTACACATTTAGAAGGAAAAGTTATCCTG -GTAGCAGTTCATGTAGCCAGTGGATATATAGAAGCAGAAGTTATTCCAGCAGAAACAGGA -CAGGAAACAGCATACTTTCTCTTAAAATTAGCAGGAAGATGGCCAGTAAAAACAATACAT -ACAGACAATGGCAGTAATTTCACTAGTACTACAGTTAAGGCCGCCTGTTGGTGGGCGGGG -ATCAAGCAGGAGTTTGGCATTCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATG -AATAAAGAATTAAAGAAAATTATAGGACAGGTAAGAGACCAGGCTGAACATCTTAAAACA -GCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTAC -AGTGCAGGGGAAAGAATAGTAGACATAATAGCAACAGACATACAAACTAAAGAATTACAA -AAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGATCCACTT -TGGAAAGGACCAGCAAAGCTTCTCTGGAAAGGTGAAGGGGCAGTAGTGATACAAGACAAT -AGTGACATAAAAGTAGTGCCAAGAAGAAAAGTAAAAATCATTAGGGATTATGGAAAACAG -ATGGCAGGTGATGATTGTGTGGCAAGTAGACAGGATGAGGATTAGAACATGGAAAAGTTT -AGTAAAACACCATATGTATGTTTCAGGGAAAGCTAAGGGATGGTTTTATAGACATCACTA -TGAAAGCCATCATCCAAGAATAAGTTCAGAAGTACATGTCCCACTAGGGGATGCTAGATT -GGTAATAACAACATATTGGGGTCTGCATACAGGAGAAAGAGATTGGCATTTGGGTCAGGG -AGTCTCCATAGAATGGAGGAAAAGGAGATATAGCACACAAGTAGACCCCAACCTAGCAGA -CCAACTGATTCATCTGTATTACTTTGATTGTTTTTCAGAATCTGCTATAAGAAGTGCCAT -ATTAGGACATATAGTTAGTCCTAGTTGTGAATATCAAGCAGGACATAACAAGGTAGGATC -TCTACAGTACTTGGCATTAGCAGCATTAATAACACCAAAAAGGAGAAAGCCCCCTTTGCC -TAGTGTTGCAAAGCTGACAGAGGATAGATGGAACAAGCCCCAGAAGACCAAGGGCCACCG -AGGGAGCCATATCAGGAATGGACACTAGAGCTTTTAGAGGAGCTTAAGAATGAAGCTGTT -AGACATTTTCCTAGGATGTGGCTCCATGGCTTAGGGCAACATATCTATGACACTTATGGG -GATACTTGGACAGGAGTGGAAGCCATAATAAGAATTCTGCAACAACTGCTGTTCATTCAT -TTCAGGATTGGGTGTCAACATAGCAGAATAGGCATTATTCGCCAGAGGAGAACAAGAAAT -GGAGCCAATAGATCCTAGACTAGAGCCCTGGAAGCATCCAGGAAGCCAGCCTAAGACTGC -TTGTACCTCTTGCTATTGTAAAAAGTGTTGCTTTCATTGTCAAGTCTGTTTCATGACAAA -AGCCTTAGGCATCTCCTATGGCAGGAAGAAGCGGAGACAGCGACGAAGAGCTTCTCAAGA -CAGTCAGACTCATCAAGTTTCTCTATCAAAGCAGTAAGTAGTACATGTAATGAACTCTTT -ACAAATATCAGCAATAGTAGCAATAGTAGTAGCAATAATACTAGCAATAGTTGTGTGGTC -TATAGTATTCATAGAATATAGGAAAATATTAAGACAAAGAAAAATAGATAGGTTAATTGA -TAGAATAAGAGAAAGAGCAGAAGACAGTGGCAATGAGAGTGAAGGGGATCAGGAAGAACT -ATCAACAGCACTTATGGAGATGGGGCACCATGCTCCTTGGGATGTTGATGATCTGTAGTG -CTGCAGGCAATTTGTGGGTCACAGTCTATTATGGGGTACCTGTGTGGAAAGAAGCAACCA -CCACTCTATTTTGTGCATCAGATGCTAAAGCATATGGTACAGAGGTACATAATGTTTGGG -CCACACATGCCTGTGTACCCACAGACCCCAACCCACAAGAAGTGAGATTGGAAAATGTGA -CAGAAAATTTTAATATGTGGAGAAATCCAATGGTAGAACAGATGCATGAGGATATAATTA -GTTTATGGGATCAAAGCCTAAAGCCATGTGTAAAGTTGACCCCACTCTGTGTCACTTTAA -ATTGCACTGATTTGGGACAGGAGAGTACCAATAATAATATCACAGGAAGTATAGAGAAAG -GAGAAATGAAAAACTGCTCTTTCAATATCTCCTCAAGCAAAGGAAGTAAGGGGCATAAAG -AATATGCATCTTTTTATAAACTTGATGTAGTACCAATAGGTAATAATAAGACTAATGGTA -ATTATTCTAGCTATAGGTTGATAAGTTGTAATACCTCAGTCATTACACAGGCCTGTCCAA -AAGTATCATTTGAGCCAATTCCCATACATTTTTGTGCCCCGGCTGGGTATGCGATTCTAA -AGTGTAATGATAAACAATTCAATGGAACAGGACCATGTACAAATGTCAGCACAGTACAGT -GTACACATGGAATTAGGCCAGTAGTATCAACTCAACTGCTGTTAAATGGTAGTCTAGCAG -AAGAAGAGGTAGTAATTAGATCTGCCAATTTCACGGACAATGCTAAAACCATAATAGTAC -AGCTGAACCAATCTGTAGAAATTACTTGTACAAGACCCGGTAACAATACAATAAGAGGGG -TTCACATGGGACCAGGGAAGGCATTTTATGCAGGAGCAATAACAGGAGATATAAGAAAAG -CACATTGTATCATTAATAAAGCAAAATGGAACAGTACTTTAAGACTGGTAGTTGCAAAAT -TAAGTGAGCAATTTAGGAATAAAACAATAAACTTTACTCAACCCTCAGGAGGGGACCCAG -AAATTGTAACACACAGTTTTAATTGTGGAGGGGAATTTTTCTACTGTAATACAACAAAAC -TGTTTAATAGTACTTGGAATGCAACACACATGATTAATGGTACTTGGAATGATACTGAGG -GAAATATCACCCTCCCATGCAGAATAAAACAAATTATAAACATGTGGCAGGAAGTAGGAA -AAGCAATGTATGCCCCTCCCATCAGAGGACAAATTAGATGTTCATCCAATATTACAGGGT -TGCTATTAACAAGAGATGGTGGTAAGACTAACGAGAGCAACACCACCGAGATCTTTAGAC -CTGGAGGAGGAGATATGAGAGACAATTGGAGAAGTGAATTATATAAATATAAAGTAGTAA -GAATTGAACCATTAGGGGTAGCACCCACCAAGGCAAAGAGAAGAGTGGTGCAGAGAGAAA -AAAGAGCAGTGGGAATAGGAGCTCTGTTCCTTGGGTTCTTGGGAGCAGCAGGAAGCACTA -TGGGCGCAACGTCGATGGCGTTGACGGTACAGGCCAGACAATTATTGTCTGGTATAGTGC -AACAGCAGAACAATTTGCTGAGAGCTATTGAGGCGCAACAACATTTGTTGCAACTCACAG -TCTGGGGCGTCAAGCAGCTCCAGGCAAGAGTCCTGGCTCTGGAAAGATACCTAAAGGATC -AACAGCTCCTGGGGTTTTGGGGTTGCTCTGGAAAACTCATTTGCACCACTGATGTGCCTT -GGAATGCTAGTTGGAGTAATAAATCTCTGGGACAAATTTGGGAGAACATGACCTGGATGG -AGTGGGAAAGAGAAATTGATAATTACACAAGCTTAATATACACTTTAATTACAGAATCGC -AGATCCAACAAGAACAGAATGAAAAAGAATTGTTGGAATTGGATAAATGGGCAAATTTGT -GGAATTGGTTTGGCATAACAAACTGGCTGTGGTACATAAAAATATTTATAATGATAGTAG -GAGGCTTAGTAGGTTTAAGAATAGTTTTTGCTGTACTTTCTATAGTGAATAGAGTTAGGC -AGGGATACTCACCATTATCGTTTCAGACCCGCTTCCCAGCCCCGAGGGGACCCGACAGGC -CCGAAGGAATCGAAGAAGAAGGTGGAGAGAGAGACAGAGACAGATCCGCTCCATTAGTGA -AAGGATTCTTAGCACTTATCTGGGTCGATCTACGGAGCCTGTGCCTCTTCAGCTACCACC -GCTTGAGAGACTTACTCTTGATAATAACGAGGATTGTGGAACTTCTGGGACGCAGGGGGT -GGGAAGTCCTCAAATACTTGTGGAGTCTCCTACAGTATTGGACACAGGAACTAAAGAATA -GTGCTGTTAGCTTGCTCAATGCCACAGCCATAGCAGTAGCTGAGGGGACAGATAGGATTA -TAGAAGTATTACAAAGAGTTTTTAGAGCTATCCTCCATATCCCTACAAGAATAAGACAGG -GCTTTGAAAGGGCTTTGCTATAAGATGGGGGGCAAGTGGTCAAAAAGTAGTTTGGTTGGA -TGGCCTAATGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATGGGGTGGGAGCA -GTATCTCGAGACTTGGAAAGACATGGAGCAATCACAAGTAGTAATACAGCAACTAACAAT -GCTGATTGTGCCTGGCTAGAAGCACAAAAGGAGGAGGAGGTGGGTTTTCCAGTCACACCT -CAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAA -GAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAAAAGACAAGATATTCTTGATCTA -TGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGG -GTCAGATATCCACTGACCTTTGGATGGTGCTTCAAGCTAGTACCAGTTGAGCCCACTGAC -AGAGAGAATGACAGATTGCTGCACCCTGCAAGCCTGCAGGGGATGGAAGACCCGGAGGGA -GAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTGGCATTTCATCACATGGCCCGAGAGCTG -CATCCGGAGTACTACAAGAACTGCTGACATCGAGCTTTCTACAAGGGACTTTCCGCTGGG -GACTTTCCAGGGGAGGCGTGGCCTGGGCGGGGCAGGGGAGTGGCGAGCCCTCAGATGCTG -CATATAAGCAGCTGCTTCTGCCTGTACTGGGTCTCTCTGGTTAGACCAGATCTGAGCCTG -GGAGCTCTCTGGCTGACTAGGGAACCCACTGCTTAAGCCTCAATAAAGCTTGCCTTGAGT -GCTTCAAGTAGTGTGTGCCCGTCTGTTGTGTGACTCTGGTAACTAGAGATCCCTCAGACC -CTTTTAGTCAGTGTGGAAAATCTCTAGCA >MN090335 GGACCTGAAAGCGAAAGTAGAACCAGAGAAGATCTCTCGACGCAGGGCTCCTTCTGATAA TGCTGAAAACATGGGTATTACTTCTGGGCTGAAAGCCTTTTCTTCTACTACTTTTACCCA